Path: blob/master/thirdparty/glslang/SPIRV/GlslangToSpv.cpp
21917 views
//
// Copyright (C) 2014-2016 LunarG, Inc.
// Copyright (C) 2015-2020 Google, Inc.
// Copyright (C) 2017, 2022-2025 Arm Limited.
// Modifications Copyright (C) 2020 Advanced Micro Devices, Inc. All rights reserved.
//
// All rights reserved.
//
// Redistribution and use in source and binary forms, with or without
// modification, are permitted provided that the following conditions
// are met:
//
// Redistributions of source code must retain the above copyright
// notice, this list of conditions and the following disclaimer.
//
// Redistributions in binary form must reproduce the above
// copyright notice, this list of conditions and the following
// disclaimer in the documentation and/or other materials provided
// with the distribution.
//
// Neither the name of 3Dlabs Inc. Ltd. nor the names of its
// contributors may be used to endorse or promote products derived
// from this software without specific prior written permission.
//
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
// FOR A PARTICULAR PURPOSE ARE DISCLAIMED.
IN NO EVENT SHALL THE28// COPYRIGHT HOLDERS OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,29// INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,30// BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;31// LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER32// CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT33// LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN34// ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE35// POSSIBILITY OF SUCH DAMAGE.3637//38// Visit the nodes in the glslang intermediate tree representation to39// translate them to SPIR-V.40//4142#include "spirv.hpp11"43#include "GlslangToSpv.h"44#include "SpvBuilder.h"45#include "SpvTools.h"46#include "spvUtil.h"4748namespace spv {49#include "GLSL.std.450.h"50#include "GLSL.ext.KHR.h"51#include "GLSL.ext.EXT.h"52#include "GLSL.ext.AMD.h"53#include "GLSL.ext.NV.h"54#include "GLSL.ext.ARM.h"55#include "GLSL.ext.QCOM.h"56#include "NonSemanticDebugPrintf.h"57}5859// Glslang includes60#include "../glslang/MachineIndependent/localintermediate.h"61#include "../glslang/MachineIndependent/SymbolTable.h"62#include "../glslang/Include/Common.h"6364// Build-time generated includes65#include "glslang/build_info.h"6667#include <fstream>68#include <iomanip>69#include <list>70#include <map>71#include <optional>72#include <stack>73#include <string>74#include <vector>7576namespace {7778namespace {79class SpecConstantOpModeGuard {80public:81SpecConstantOpModeGuard(spv::Builder* builder)82: builder_(builder) {83previous_flag_ = builder->isInSpecConstCodeGenMode();84}85~SpecConstantOpModeGuard() {86previous_flag_ ? 
builder_->setToSpecConstCodeGenMode()87: builder_->setToNormalCodeGenMode();88}89void turnOnSpecConstantOpMode() {90builder_->setToSpecConstCodeGenMode();91}9293private:94spv::Builder* builder_;95bool previous_flag_;96};9798struct OpDecorations {99public:100OpDecorations(spv::Decoration precision, spv::Decoration noContraction, spv::Decoration nonUniform) :101precision(precision)102,103noContraction(noContraction),104nonUniform(nonUniform)105{ }106107spv::Decoration precision;108109void addNoContraction(spv::Builder& builder, spv::Id t) { builder.addDecoration(t, noContraction); }110void addNonUniform(spv::Builder& builder, spv::Id t) { builder.addDecoration(t, nonUniform); }111protected:112spv::Decoration noContraction;113spv::Decoration nonUniform;114};115116} // namespace117118//119// The main holder of information for translating glslang to SPIR-V.120//121// Derives from the AST walking base class.122//123class TGlslangToSpvTraverser : public glslang::TIntermTraverser {124public:125TGlslangToSpvTraverser(unsigned int spvVersion, const glslang::TIntermediate*, spv::SpvBuildLogger* logger,126glslang::SpvOptions& options);127virtual ~TGlslangToSpvTraverser() { }128129bool visitAggregate(glslang::TVisit, glslang::TIntermAggregate*) override;130bool visitBinary(glslang::TVisit, glslang::TIntermBinary*) override;131void visitConstantUnion(glslang::TIntermConstantUnion*) override;132bool visitSelection(glslang::TVisit, glslang::TIntermSelection*) override;133bool visitSwitch(glslang::TVisit, glslang::TIntermSwitch*) override;134void visitSymbol(glslang::TIntermSymbol* symbol) override;135bool visitUnary(glslang::TVisit, glslang::TIntermUnary*) override;136bool visitLoop(glslang::TVisit, glslang::TIntermLoop*) override;137bool visitBranch(glslang::TVisit visit, glslang::TIntermBranch*) override;138bool visitVariableDecl(glslang::TVisit, glslang::TIntermVariableDecl*) override;139140void finishSpv(bool compileOnly);141void dumpSpv(std::vector<unsigned int>& 
out);142143protected:144TGlslangToSpvTraverser(TGlslangToSpvTraverser&);145TGlslangToSpvTraverser& operator=(TGlslangToSpvTraverser&);146147spv::Decoration TranslateInterpolationDecoration(const glslang::TQualifier& qualifier);148spv::Decoration TranslateAuxiliaryStorageDecoration(const glslang::TQualifier& qualifier);149spv::Decoration TranslateNonUniformDecoration(const glslang::TQualifier& qualifier);150spv::Decoration TranslateNonUniformDecoration(const spv::Builder::AccessChain::CoherentFlags& coherentFlags);151spv::Builder::AccessChain::CoherentFlags TranslateCoherent(const glslang::TType& type);152spv::MemoryAccessMask TranslateMemoryAccess(const spv::Builder::AccessChain::CoherentFlags &coherentFlags);153spv::ImageOperandsMask TranslateImageOperands(const spv::Builder::AccessChain::CoherentFlags &coherentFlags);154spv::Scope TranslateMemoryScope(const spv::Builder::AccessChain::CoherentFlags &coherentFlags);155spv::BuiltIn TranslateBuiltInDecoration(glslang::TBuiltInVariable, bool memberDeclaration);156spv::ImageFormat TranslateImageFormat(const glslang::TType& type);157spv::SelectionControlMask TranslateSelectionControl(const glslang::TIntermSelection&) const;158spv::SelectionControlMask TranslateSwitchControl(const glslang::TIntermSwitch&) const;159spv::LoopControlMask TranslateLoopControl(const glslang::TIntermLoop&, std::vector<unsigned int>& operands) const;160spv::StorageClass TranslateStorageClass(const glslang::TType&);161void TranslateLiterals(const glslang::TVector<const glslang::TIntermConstantUnion*>&, std::vector<unsigned>&) const;162void addIndirectionIndexCapabilities(const glslang::TType& baseType, const glslang::TType& indexType);163spv::Id createSpvVariable(const glslang::TIntermSymbol*, spv::Id forcedType);164spv::Id getSampledType(const glslang::TSampler&);165spv::Id getInvertedSwizzleType(const glslang::TIntermTyped&);166spv::Id createInvertedSwizzle(spv::Decoration precision, const glslang::TIntermTyped&, spv::Id parentResult);167void 
convertSwizzle(const glslang::TIntermAggregate&, std::vector<unsigned>& swizzle);168spv::Id convertGlslangToSpvType(const glslang::TType& type, bool forwardReferenceOnly = false);169spv::Id convertGlslangToSpvType(const glslang::TType& type, glslang::TLayoutPacking, const glslang::TQualifier&,170bool lastBufferBlockMember, bool forwardReferenceOnly = false);171void applySpirvDecorate(const glslang::TType& type, spv::Id id, std::optional<int> member);172bool filterMember(const glslang::TType& member);173spv::Id convertGlslangStructToSpvType(const glslang::TType&, const glslang::TTypeList* glslangStruct,174glslang::TLayoutPacking, const glslang::TQualifier&);175spv::LinkageType convertGlslangLinkageToSpv(glslang::TLinkType glslangLinkType);176void decorateStructType(const glslang::TType&, const glslang::TTypeList* glslangStruct, glslang::TLayoutPacking,177const glslang::TQualifier&, spv::Id, const std::vector<spv::Id>& spvMembers);178spv::Id makeArraySizeId(const glslang::TArraySizes&, int dim, bool allowZero = false, bool boolType = false);179spv::Id accessChainLoad(const glslang::TType& type);180void accessChainStore(const glslang::TType& type, spv::Id rvalue);181void multiTypeStore(const glslang::TType&, spv::Id rValue);182spv::Id convertLoadedBoolInUniformToUint(const glslang::TType& type, spv::Id nominalTypeId, spv::Id loadedId);183glslang::TLayoutPacking getExplicitLayout(const glslang::TType& type) const;184int getArrayStride(const glslang::TType& arrayType, glslang::TLayoutPacking, glslang::TLayoutMatrix);185int getMatrixStride(const glslang::TType& matrixType, glslang::TLayoutPacking, glslang::TLayoutMatrix);186void updateMemberOffset(const glslang::TType& structType, const glslang::TType& memberType, int& currentOffset,187int& nextOffset, glslang::TLayoutPacking, glslang::TLayoutMatrix);188void declareUseOfStructMember(const glslang::TTypeList& members, int glslangMember);189190bool isShaderEntryPoint(const glslang::TIntermAggregate* node);191bool 
writableParam(glslang::TStorageQualifier) const;192bool originalParam(glslang::TStorageQualifier, const glslang::TType&, bool implicitThisParam);193void makeFunctions(const glslang::TIntermSequence&);194void makeGlobalInitializers(const glslang::TIntermSequence&);195void collectRayTracingLinkerObjects();196void visitFunctions(const glslang::TIntermSequence&);197void translateArguments(const glslang::TIntermAggregate& node, std::vector<spv::Id>& arguments,198spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags);199void translateArguments(glslang::TIntermUnary& node, std::vector<spv::Id>& arguments);200spv::Id createImageTextureFunctionCall(glslang::TIntermOperator* node);201spv::Id handleUserFunctionCall(const glslang::TIntermAggregate*);202203spv::Id createBinaryOperation(glslang::TOperator op, OpDecorations&, spv::Id typeId, spv::Id left, spv::Id right,204glslang::TBasicType typeProxy, bool reduceComparison = true);205spv::Id createBinaryMatrixOperation(spv::Op, OpDecorations&, spv::Id typeId, spv::Id left, spv::Id right);206spv::Id createUnaryOperation(glslang::TOperator op, OpDecorations&, spv::Id typeId, spv::Id operand,207glslang::TBasicType typeProxy,208const spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags,209const glslang::TType &opType);210spv::Id createUnaryMatrixOperation(spv::Op op, OpDecorations&, spv::Id typeId, spv::Id operand,211glslang::TBasicType typeProxy);212spv::Id createConversion(glslang::TOperator op, OpDecorations&, spv::Id destTypeId, spv::Id operand,213glslang::TBasicType resultBasicType, glslang::TBasicType operandBasicType);214spv::Id createIntWidthConversion(spv::Id operand, int vectorSize, spv::Id destType,215glslang::TBasicType resultBasicType, glslang::TBasicType operandBasicType);216spv::Id makeSmearedConstant(spv::Id constant, int vectorSize);217spv::Id createAtomicOperation(glslang::TOperator op, spv::Decoration precision, spv::Id typeId,218std::vector<spv::Id>& operands, glslang::TBasicType 
typeProxy,219const spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags,220const glslang::TType &opType);221spv::Id createInvocationsOperation(glslang::TOperator op, spv::Id typeId, std::vector<spv::Id>& operands,222glslang::TBasicType typeProxy);223spv::Id CreateInvocationsVectorOperation(spv::Op op, spv::GroupOperation groupOperation,224spv::Id typeId, std::vector<spv::Id>& operands);225spv::Id createSubgroupOperation(glslang::TOperator op, spv::Id typeId, std::vector<spv::Id>& operands,226glslang::TBasicType typeProxy);227spv::Id createMiscOperation(glslang::TOperator op, spv::Decoration precision, spv::Id typeId,228std::vector<spv::Id>& operands, glslang::TBasicType typeProxy);229spv::Id createNoArgOperation(glslang::TOperator op, spv::Decoration precision, spv::Id typeId);230spv::Id getSymbolId(const glslang::TIntermSymbol* node);231void addMeshNVDecoration(spv::Id id, int member, const glslang::TQualifier & qualifier);232bool hasQCOMImageProceessingDecoration(spv::Id id, spv::Decoration decor);233void addImageProcessingQCOMDecoration(spv::Id id, spv::Decoration decor);234void addImageProcessing2QCOMDecoration(spv::Id id, bool isForGather);235spv::Id createSpvConstant(const glslang::TIntermTyped&);236spv::Id createSpvConstantFromConstUnionArray(const glslang::TType& type, const glslang::TConstUnionArray&,237int& nextConst, bool specConstant);238bool isTrivialLeaf(const glslang::TIntermTyped* node);239bool isTrivial(const glslang::TIntermTyped* node);240spv::Id createShortCircuit(glslang::TOperator, glslang::TIntermTyped& left, glslang::TIntermTyped& right);241spv::Id getExtBuiltins(const char* name);242std::pair<spv::Id, spv::Id> getForcedType(glslang::TBuiltInVariable builtIn, const glslang::TType&);243spv::Id translateForcedType(spv::Id object);244spv::Id createCompositeConstruct(spv::Id typeId, std::vector<spv::Id> constituents);245246glslang::SpvOptions& options;247spv::Function* shaderEntry;248spv::Function* currentFunction;249spv::Instruction* 
entryPoint;250int sequenceDepth;251252spv::SpvBuildLogger* logger;253254// There is a 1:1 mapping between a spv builder and a module; this is thread safe255spv::Builder builder;256bool inEntryPoint;257bool entryPointTerminated;258bool linkageOnly; // true when visiting the set of objects in the AST present only for259// establishing interface, whether or not they were statically used260std::set<spv::Id> iOSet; // all input/output variables from either static use or declaration of interface261const glslang::TIntermediate* glslangIntermediate;262bool nanMinMaxClamp; // true if use NMin/NMax/NClamp instead of FMin/FMax/FClamp263spv::Id stdBuiltins;264spv::Id nonSemanticDebugPrintf;265std::unordered_map<std::string, spv::Id> extBuiltinMap;266267std::unordered_map<long long, spv::Id> symbolValues;268std::unordered_map<uint32_t, spv::Id> builtInVariableIds;269std::unordered_set<long long> rValueParameters; // set of formal function parameters passed as rValues,270// rather than a pointer271std::unordered_map<std::string, spv::Function*> functionMap;272std::unordered_map<const glslang::TTypeList*, spv::Id> structMap[glslang::ElpCount][glslang::ElmCount];273// for mapping glslang block indices to spv indices (e.g., due to hidden members):274std::unordered_map<long long, std::vector<int>> memberRemapper;275// for mapping glslang symbol struct to symbol Id276std::unordered_map<const glslang::TTypeList*, long long> glslangTypeToIdMap;277std::stack<bool> breakForLoop; // false means break for switch278std::unordered_map<std::string, const glslang::TIntermSymbol*> counterOriginator;279// Map pointee types for EbtReference to their forward pointers280std::map<const glslang::TType *, spv::Id> forwardPointers;281// Type forcing, for when SPIR-V wants a different type than the AST,282// requiring local translation to and from SPIR-V type on every access.283// Maps <builtin-variable-id -> AST-required-type-id>284std::unordered_map<spv::Id, spv::Id> forceType;285// Used by Task 
shader while generating opearnds for OpEmitMeshTasksEXT286spv::Id taskPayloadID;287// Used later for generating OpTraceKHR/OpExecuteCallableKHR/OpHitObjectRecordHit*/OpHitObjectGetShaderBindingTableData288std::unordered_map<unsigned int, glslang::TIntermSymbol *> locationToSymbol[4];289std::unordered_map<spv::Id, std::vector<spv::Decoration> > idToQCOMDecorations;290};291292//293// Helper functions for translating glslang representations to SPIR-V enumerants.294//295296// Translate glslang profile to SPIR-V source language.297spv::SourceLanguage TranslateSourceLanguage(glslang::EShSource source, EProfile profile)298{299switch (source) {300case glslang::EShSourceGlsl:301switch (profile) {302case ENoProfile:303case ECoreProfile:304case ECompatibilityProfile:305return spv::SourceLanguage::GLSL;306case EEsProfile:307return spv::SourceLanguage::ESSL;308default:309return spv::SourceLanguage::Unknown;310}311case glslang::EShSourceHlsl:312return spv::SourceLanguage::HLSL;313default:314return spv::SourceLanguage::Unknown;315}316}317318// Translate glslang language (stage) to SPIR-V execution model.319spv::ExecutionModel TranslateExecutionModel(EShLanguage stage, bool isMeshShaderEXT = false)320{321switch (stage) {322case EShLangVertex: return spv::ExecutionModel::Vertex;323case EShLangFragment: return spv::ExecutionModel::Fragment;324case EShLangCompute: return spv::ExecutionModel::GLCompute;325case EShLangTessControl: return spv::ExecutionModel::TessellationControl;326case EShLangTessEvaluation: return spv::ExecutionModel::TessellationEvaluation;327case EShLangGeometry: return spv::ExecutionModel::Geometry;328case EShLangRayGen: return spv::ExecutionModel::RayGenerationKHR;329case EShLangIntersect: return spv::ExecutionModel::IntersectionKHR;330case EShLangAnyHit: return spv::ExecutionModel::AnyHitKHR;331case EShLangClosestHit: return spv::ExecutionModel::ClosestHitKHR;332case EShLangMiss: return spv::ExecutionModel::MissKHR;333case EShLangCallable: return 
spv::ExecutionModel::CallableKHR;334case EShLangTask: return (isMeshShaderEXT)? spv::ExecutionModel::TaskEXT : spv::ExecutionModel::TaskNV;335case EShLangMesh: return (isMeshShaderEXT)? spv::ExecutionModel::MeshEXT : spv::ExecutionModel::MeshNV;336default:337assert(0);338return spv::ExecutionModel::Fragment;339}340}341342// Translate glslang sampler type to SPIR-V dimensionality.343spv::Dim TranslateDimensionality(const glslang::TSampler& sampler)344{345switch (sampler.dim) {346case glslang::Esd1D: return spv::Dim::Dim1D;347case glslang::Esd2D: return spv::Dim::Dim2D;348case glslang::Esd3D: return spv::Dim::Dim3D;349case glslang::EsdCube: return spv::Dim::Cube;350case glslang::EsdRect: return spv::Dim::Rect;351case glslang::EsdBuffer: return spv::Dim::Buffer;352case glslang::EsdSubpass: return spv::Dim::SubpassData;353case glslang::EsdAttachmentEXT: return spv::Dim::TileImageDataEXT;354default:355assert(0);356return spv::Dim::Dim2D;357}358}359360// Translate glslang precision to SPIR-V precision decorations.361spv::Decoration TranslatePrecisionDecoration(glslang::TPrecisionQualifier glslangPrecision)362{363switch (glslangPrecision) {364case glslang::EpqLow: return spv::Decoration::RelaxedPrecision;365case glslang::EpqMedium: return spv::Decoration::RelaxedPrecision;366default:367return spv::NoPrecision;368}369}370371// Translate glslang type to SPIR-V precision decorations.372spv::Decoration TranslatePrecisionDecoration(const glslang::TType& type)373{374return TranslatePrecisionDecoration(type.getQualifier().precision);375}376377// Translate glslang type to SPIR-V block decorations.378spv::Decoration TranslateBlockDecoration(const glslang::TStorageQualifier storage, bool useStorageBuffer)379{380switch (storage) {381case glslang::EvqUniform: return spv::Decoration::Block;382case glslang::EvqBuffer: return useStorageBuffer ? 
spv::Decoration::Block : spv::Decoration::BufferBlock;383case glslang::EvqVaryingIn: return spv::Decoration::Block;384case glslang::EvqVaryingOut: return spv::Decoration::Block;385case glslang::EvqShared: return spv::Decoration::Block;386case glslang::EvqPayload: return spv::Decoration::Block;387case glslang::EvqPayloadIn: return spv::Decoration::Block;388case glslang::EvqHitAttr: return spv::Decoration::Block;389case glslang::EvqCallableData: return spv::Decoration::Block;390case glslang::EvqCallableDataIn: return spv::Decoration::Block;391case glslang::EvqHitObjectAttrNV: return spv::Decoration::Block;392case glslang::EvqHitObjectAttrEXT: return spv::Decoration::Block;393default:394assert(0);395break;396}397398return spv::Decoration::Max;399}400401// Translate glslang type to SPIR-V memory decorations.402void TranslateMemoryDecoration(const glslang::TQualifier& qualifier, std::vector<spv::Decoration>& memory,403bool useVulkanMemoryModel)404{405if (!useVulkanMemoryModel) {406if (qualifier.isVolatile()) {407memory.push_back(spv::Decoration::Volatile);408memory.push_back(spv::Decoration::Coherent);409} else if (qualifier.isCoherent()) {410memory.push_back(spv::Decoration::Coherent);411}412}413if (qualifier.isRestrict())414memory.push_back(spv::Decoration::Restrict);415if (qualifier.isReadOnly())416memory.push_back(spv::Decoration::NonWritable);417if (qualifier.isWriteOnly())418memory.push_back(spv::Decoration::NonReadable);419}420421// Translate glslang type to SPIR-V layout decorations.422spv::Decoration TranslateLayoutDecoration(const glslang::TType& type, glslang::TLayoutMatrix matrixLayout)423{424if (type.isMatrix()) {425switch (matrixLayout) {426case glslang::ElmRowMajor:427return spv::Decoration::RowMajor;428case glslang::ElmColumnMajor:429return spv::Decoration::ColMajor;430default:431// opaque layouts don't need a majorness432return spv::Decoration::Max;433}434} else {435switch (type.getBasicType()) {436default:437return spv::Decoration::Max;438break;439case 
glslang::EbtBlock:440switch (type.getQualifier().storage) {441case glslang::EvqShared:442case glslang::EvqUniform:443case glslang::EvqBuffer:444switch (type.getQualifier().layoutPacking) {445case glslang::ElpShared: return spv::Decoration::GLSLShared;446case glslang::ElpPacked: return spv::Decoration::GLSLPacked;447default:448return spv::Decoration::Max;449}450case glslang::EvqVaryingIn:451case glslang::EvqVaryingOut:452if (type.getQualifier().isTaskMemory()) {453switch (type.getQualifier().layoutPacking) {454case glslang::ElpShared: return spv::Decoration::GLSLShared;455case glslang::ElpPacked: return spv::Decoration::GLSLPacked;456default: break;457}458} else {459assert(type.getQualifier().layoutPacking == glslang::ElpNone);460}461return spv::Decoration::Max;462case glslang::EvqPayload:463case glslang::EvqPayloadIn:464case glslang::EvqHitAttr:465case glslang::EvqCallableData:466case glslang::EvqCallableDataIn:467case glslang::EvqHitObjectAttrNV:468case glslang::EvqHitObjectAttrEXT:469return spv::Decoration::Max;470default:471assert(0);472return spv::Decoration::Max;473}474}475}476}477478// Translate glslang type to SPIR-V interpolation decorations.479// Returns spv::Decoration::Max when no decoration480// should be applied.481spv::Decoration TGlslangToSpvTraverser::TranslateInterpolationDecoration(const glslang::TQualifier& qualifier)482{483if (qualifier.smooth)484// Smooth decoration doesn't exist in SPIR-V 1.0485return spv::Decoration::Max;486else if (qualifier.isNonPerspective())487return spv::Decoration::NoPerspective;488else if (qualifier.flat)489return spv::Decoration::Flat;490else if (qualifier.isExplicitInterpolation()) {491builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);492return spv::Decoration::ExplicitInterpAMD;493}494else495return spv::Decoration::Max;496}497498// Translate glslang type to SPIR-V auxiliary storage decorations.499// Returns spv::Decoration::Max when no decoration500// should be applied.501spv::Decoration 
TGlslangToSpvTraverser::TranslateAuxiliaryStorageDecoration(const glslang::TQualifier& qualifier)502{503if (qualifier.centroid)504return spv::Decoration::Centroid;505else if (qualifier.patch)506return spv::Decoration::Patch;507else if (qualifier.sample) {508builder.addCapability(spv::Capability::SampleRateShading);509return spv::Decoration::Sample;510}511512return spv::Decoration::Max;513}514515// If glslang type is invariant, return SPIR-V invariant decoration.516spv::Decoration TranslateInvariantDecoration(const glslang::TQualifier& qualifier)517{518if (qualifier.invariant)519return spv::Decoration::Invariant;520else521return spv::Decoration::Max;522}523524// If glslang type is noContraction, return SPIR-V NoContraction decoration.525spv::Decoration TranslateNoContractionDecoration(const glslang::TQualifier& qualifier)526{527if (qualifier.isNoContraction())528return spv::Decoration::NoContraction;529else530return spv::Decoration::Max;531}532533// If glslang type is nonUniform, return SPIR-V NonUniform decoration.534spv::Decoration TGlslangToSpvTraverser::TranslateNonUniformDecoration(const glslang::TQualifier& qualifier)535{536if (qualifier.isNonUniform()) {537builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);538builder.addCapability(spv::Capability::ShaderNonUniformEXT);539return spv::Decoration::NonUniformEXT;540} else541return spv::Decoration::Max;542}543544// If lvalue flags contains nonUniform, return SPIR-V NonUniform decoration.545spv::Decoration TGlslangToSpvTraverser::TranslateNonUniformDecoration(546const spv::Builder::AccessChain::CoherentFlags& coherentFlags)547{548if (coherentFlags.isNonUniform()) {549builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);550builder.addCapability(spv::Capability::ShaderNonUniformEXT);551return spv::Decoration::NonUniformEXT;552} else553return spv::Decoration::Max;554}555556spv::MemoryAccessMask TGlslangToSpvTraverser::TranslateMemoryAccess(557const 
spv::Builder::AccessChain::CoherentFlags &coherentFlags)558{559spv::MemoryAccessMask mask = spv::MemoryAccessMask::MaskNone;560561if (!glslangIntermediate->usingVulkanMemoryModel() || coherentFlags.isImage)562return mask;563564if (coherentFlags.isVolatile() || coherentFlags.anyCoherent()) {565mask = mask | spv::MemoryAccessMask::MakePointerAvailableKHR |566spv::MemoryAccessMask::MakePointerVisibleKHR;567}568569if (coherentFlags.nonprivate) {570mask = mask | spv::MemoryAccessMask::NonPrivatePointerKHR;571}572if (coherentFlags.volatil) {573mask = mask | spv::MemoryAccessMask::Volatile;574}575if (coherentFlags.nontemporal) {576mask = mask | spv::MemoryAccessMask::Nontemporal;577}578if (mask != spv::MemoryAccessMask::MaskNone) {579builder.addCapability(spv::Capability::VulkanMemoryModelKHR);580}581582return mask;583}584585spv::ImageOperandsMask TGlslangToSpvTraverser::TranslateImageOperands(586const spv::Builder::AccessChain::CoherentFlags &coherentFlags)587{588spv::ImageOperandsMask mask = spv::ImageOperandsMask::MaskNone;589590if (!glslangIntermediate->usingVulkanMemoryModel())591return mask;592593if (coherentFlags.volatil ||594coherentFlags.anyCoherent()) {595mask = mask | spv::ImageOperandsMask::MakeTexelAvailableKHR |596spv::ImageOperandsMask::MakeTexelVisibleKHR;597}598if (coherentFlags.nonprivate) {599mask = mask | spv::ImageOperandsMask::NonPrivateTexelKHR;600}601if (coherentFlags.volatil) {602mask = mask | spv::ImageOperandsMask::VolatileTexelKHR;603}604if (coherentFlags.nontemporal && builder.getSpvVersion() >= spv::Spv_1_6) {605mask = mask | spv::ImageOperandsMask::Nontemporal;606}607if (mask != spv::ImageOperandsMask::MaskNone) {608builder.addCapability(spv::Capability::VulkanMemoryModelKHR);609}610611return mask;612}613614spv::Builder::AccessChain::CoherentFlags TGlslangToSpvTraverser::TranslateCoherent(const glslang::TType& type)615{616spv::Builder::AccessChain::CoherentFlags flags = {};617flags.coherent = 
type.getQualifier().coherent;618flags.devicecoherent = type.getQualifier().devicecoherent;619flags.queuefamilycoherent = type.getQualifier().queuefamilycoherent;620// shared variables are implicitly workgroupcoherent in GLSL.621flags.workgroupcoherent = type.getQualifier().workgroupcoherent ||622type.getQualifier().storage == glslang::EvqShared;623flags.subgroupcoherent = type.getQualifier().subgroupcoherent;624flags.shadercallcoherent = type.getQualifier().shadercallcoherent;625flags.volatil = type.getQualifier().volatil;626flags.nontemporal = type.getQualifier().nontemporal;627// *coherent variables are implicitly nonprivate in GLSL628flags.nonprivate = type.getQualifier().nonprivate ||629flags.anyCoherent() ||630flags.volatil;631flags.isImage = type.getBasicType() == glslang::EbtSampler;632flags.nonUniform = type.getQualifier().nonUniform;633return flags;634}635636spv::Scope TGlslangToSpvTraverser::TranslateMemoryScope(637const spv::Builder::AccessChain::CoherentFlags &coherentFlags)638{639spv::Scope scope = spv::Scope::Max;640641if (coherentFlags.volatil || coherentFlags.coherent) {642// coherent defaults to Device scope in the old model, QueueFamilyKHR scope in the new model643scope = glslangIntermediate->usingVulkanMemoryModel() ? spv::Scope::QueueFamilyKHR : spv::Scope::Device;644} else if (coherentFlags.devicecoherent) {645scope = spv::Scope::Device;646} else if (coherentFlags.queuefamilycoherent) {647scope = spv::Scope::QueueFamilyKHR;648} else if (coherentFlags.workgroupcoherent) {649scope = spv::Scope::Workgroup;650} else if (coherentFlags.subgroupcoherent) {651scope = spv::Scope::Subgroup;652} else if (coherentFlags.shadercallcoherent) {653scope = spv::Scope::ShaderCallKHR;654}655if (glslangIntermediate->usingVulkanMemoryModel() && scope == spv::Scope::Device) {656builder.addCapability(spv::Capability::VulkanMemoryModelDeviceScopeKHR);657}658659return scope;660}661662// Translate a glslang built-in variable to a SPIR-V built in decoration. 
Also generate663// associated capabilities when required. For some built-in variables, a capability664// is generated only when using the variable in an executable instruction, but not when665// just declaring a struct member variable with it. This is true for PointSize,666// ClipDistance, and CullDistance.667spv::BuiltIn TGlslangToSpvTraverser::TranslateBuiltInDecoration(glslang::TBuiltInVariable builtIn,668bool memberDeclaration)669{670switch (builtIn) {671case glslang::EbvPointSize:672// Defer adding the capability until the built-in is actually used.673if (! memberDeclaration) {674switch (glslangIntermediate->getStage()) {675case EShLangGeometry:676builder.addCapability(spv::Capability::GeometryPointSize);677break;678case EShLangTessControl:679case EShLangTessEvaluation:680builder.addCapability(spv::Capability::TessellationPointSize);681break;682default:683break;684}685}686return spv::BuiltIn::PointSize;687688case glslang::EbvPosition: return spv::BuiltIn::Position;689case glslang::EbvVertexId: return spv::BuiltIn::VertexId;690case glslang::EbvInstanceId: return spv::BuiltIn::InstanceId;691case glslang::EbvVertexIndex: return spv::BuiltIn::VertexIndex;692case glslang::EbvInstanceIndex: return spv::BuiltIn::InstanceIndex;693694case glslang::EbvFragCoord: return spv::BuiltIn::FragCoord;695case glslang::EbvPointCoord: return spv::BuiltIn::PointCoord;696case glslang::EbvFace: return spv::BuiltIn::FrontFacing;697case glslang::EbvFragDepth: return spv::BuiltIn::FragDepth;698699case glslang::EbvNumWorkGroups: return spv::BuiltIn::NumWorkgroups;700case glslang::EbvWorkGroupSize: return spv::BuiltIn::WorkgroupSize;701case glslang::EbvWorkGroupId: return spv::BuiltIn::WorkgroupId;702case glslang::EbvLocalInvocationId: return spv::BuiltIn::LocalInvocationId;703case glslang::EbvLocalInvocationIndex: return spv::BuiltIn::LocalInvocationIndex;704case glslang::EbvGlobalInvocationId: return spv::BuiltIn::GlobalInvocationId;705706// These *Distance capabilities logically belong 
here, but if the member is declared and707// then never used, consumers of SPIR-V prefer the capability not be declared.708// They are now generated when used, rather than here when declared.709// Potentially, the specification should be more clear what the minimum710// use needed is to trigger the capability.711//712case glslang::EbvClipDistance:713if (!memberDeclaration)714builder.addCapability(spv::Capability::ClipDistance);715return spv::BuiltIn::ClipDistance;716717case glslang::EbvCullDistance:718if (!memberDeclaration)719builder.addCapability(spv::Capability::CullDistance);720return spv::BuiltIn::CullDistance;721722case glslang::EbvViewportIndex:723if (glslangIntermediate->getStage() == EShLangGeometry ||724glslangIntermediate->getStage() == EShLangFragment) {725builder.addCapability(spv::Capability::MultiViewport);726}727if (glslangIntermediate->getStage() == EShLangVertex ||728glslangIntermediate->getStage() == EShLangTessControl ||729glslangIntermediate->getStage() == EShLangTessEvaluation) {730731if (builder.getSpvVersion() < spv::Spv_1_5) {732builder.addIncorporatedExtension(spv::E_SPV_EXT_shader_viewport_index_layer, spv::Spv_1_5);733builder.addCapability(spv::Capability::ShaderViewportIndexLayerEXT);734}735else736builder.addCapability(spv::Capability::ShaderViewportIndex);737}738return spv::BuiltIn::ViewportIndex;739740case glslang::EbvSampleId:741builder.addCapability(spv::Capability::SampleRateShading);742return spv::BuiltIn::SampleId;743744case glslang::EbvSamplePosition:745builder.addCapability(spv::Capability::SampleRateShading);746return spv::BuiltIn::SamplePosition;747748case glslang::EbvSampleMask:749return spv::BuiltIn::SampleMask;750751case glslang::EbvLayer:752if (glslangIntermediate->getStage() == EShLangMesh) {753return spv::BuiltIn::Layer;754}755if (glslangIntermediate->getStage() == EShLangGeometry ||756glslangIntermediate->getStage() == EShLangFragment) {757builder.addCapability(spv::Capability::Geometry);758}759if 
(glslangIntermediate->getStage() == EShLangVertex ||760glslangIntermediate->getStage() == EShLangTessControl ||761glslangIntermediate->getStage() == EShLangTessEvaluation) {762763if (builder.getSpvVersion() < spv::Spv_1_5) {764builder.addIncorporatedExtension(spv::E_SPV_EXT_shader_viewport_index_layer, spv::Spv_1_5);765builder.addCapability(spv::Capability::ShaderViewportIndexLayerEXT);766} else767builder.addCapability(spv::Capability::ShaderLayer);768}769return spv::BuiltIn::Layer;770771case glslang::EbvBaseVertex:772builder.addIncorporatedExtension(spv::E_SPV_KHR_shader_draw_parameters, spv::Spv_1_3);773builder.addCapability(spv::Capability::DrawParameters);774return spv::BuiltIn::BaseVertex;775776case glslang::EbvBaseInstance:777builder.addIncorporatedExtension(spv::E_SPV_KHR_shader_draw_parameters, spv::Spv_1_3);778builder.addCapability(spv::Capability::DrawParameters);779return spv::BuiltIn::BaseInstance;780781case glslang::EbvDrawId:782builder.addIncorporatedExtension(spv::E_SPV_KHR_shader_draw_parameters, spv::Spv_1_3);783builder.addCapability(spv::Capability::DrawParameters);784return spv::BuiltIn::DrawIndex;785786case glslang::EbvPrimitiveId:787if (glslangIntermediate->getStage() == EShLangFragment)788builder.addCapability(spv::Capability::Geometry);789return spv::BuiltIn::PrimitiveId;790791case glslang::EbvFragStencilRef:792builder.addExtension(spv::E_SPV_EXT_shader_stencil_export);793builder.addCapability(spv::Capability::StencilExportEXT);794return spv::BuiltIn::FragStencilRefEXT;795796case glslang::EbvShadingRateKHR:797builder.addExtension(spv::E_SPV_KHR_fragment_shading_rate);798builder.addCapability(spv::Capability::FragmentShadingRateKHR);799return spv::BuiltIn::ShadingRateKHR;800801case glslang::EbvPrimitiveShadingRateKHR:802builder.addExtension(spv::E_SPV_KHR_fragment_shading_rate);803builder.addCapability(spv::Capability::FragmentShadingRateKHR);804return spv::BuiltIn::PrimitiveShadingRateKHR;805806case glslang::EbvInvocationId: return 
spv::BuiltIn::InvocationId;807case glslang::EbvTessLevelInner: return spv::BuiltIn::TessLevelInner;808case glslang::EbvTessLevelOuter: return spv::BuiltIn::TessLevelOuter;809case glslang::EbvTessCoord: return spv::BuiltIn::TessCoord;810case glslang::EbvPatchVertices: return spv::BuiltIn::PatchVertices;811case glslang::EbvHelperInvocation: return spv::BuiltIn::HelperInvocation;812813case glslang::EbvSubGroupSize:814builder.addExtension(spv::E_SPV_KHR_shader_ballot);815builder.addCapability(spv::Capability::SubgroupBallotKHR);816return spv::BuiltIn::SubgroupSize;817818case glslang::EbvSubGroupInvocation:819builder.addExtension(spv::E_SPV_KHR_shader_ballot);820builder.addCapability(spv::Capability::SubgroupBallotKHR);821return spv::BuiltIn::SubgroupLocalInvocationId;822823case glslang::EbvSubGroupEqMask:824builder.addExtension(spv::E_SPV_KHR_shader_ballot);825builder.addCapability(spv::Capability::SubgroupBallotKHR);826return spv::BuiltIn::SubgroupEqMask;827828case glslang::EbvSubGroupGeMask:829builder.addExtension(spv::E_SPV_KHR_shader_ballot);830builder.addCapability(spv::Capability::SubgroupBallotKHR);831return spv::BuiltIn::SubgroupGeMask;832833case glslang::EbvSubGroupGtMask:834builder.addExtension(spv::E_SPV_KHR_shader_ballot);835builder.addCapability(spv::Capability::SubgroupBallotKHR);836return spv::BuiltIn::SubgroupGtMask;837838case glslang::EbvSubGroupLeMask:839builder.addExtension(spv::E_SPV_KHR_shader_ballot);840builder.addCapability(spv::Capability::SubgroupBallotKHR);841return spv::BuiltIn::SubgroupLeMask;842843case glslang::EbvSubGroupLtMask:844builder.addExtension(spv::E_SPV_KHR_shader_ballot);845builder.addCapability(spv::Capability::SubgroupBallotKHR);846return spv::BuiltIn::SubgroupLtMask;847848case glslang::EbvNumSubgroups:849builder.addCapability(spv::Capability::GroupNonUniform);850return spv::BuiltIn::NumSubgroups;851852case glslang::EbvSubgroupID:853builder.addCapability(spv::Capability::GroupNonUniform);854return 
spv::BuiltIn::SubgroupId;855856case glslang::EbvSubgroupSize2:857builder.addCapability(spv::Capability::GroupNonUniform);858return spv::BuiltIn::SubgroupSize;859860case glslang::EbvSubgroupInvocation2:861builder.addCapability(spv::Capability::GroupNonUniform);862return spv::BuiltIn::SubgroupLocalInvocationId;863864case glslang::EbvSubgroupEqMask2:865builder.addCapability(spv::Capability::GroupNonUniform);866builder.addCapability(spv::Capability::GroupNonUniformBallot);867return spv::BuiltIn::SubgroupEqMask;868869case glslang::EbvSubgroupGeMask2:870builder.addCapability(spv::Capability::GroupNonUniform);871builder.addCapability(spv::Capability::GroupNonUniformBallot);872return spv::BuiltIn::SubgroupGeMask;873874case glslang::EbvSubgroupGtMask2:875builder.addCapability(spv::Capability::GroupNonUniform);876builder.addCapability(spv::Capability::GroupNonUniformBallot);877return spv::BuiltIn::SubgroupGtMask;878879case glslang::EbvSubgroupLeMask2:880builder.addCapability(spv::Capability::GroupNonUniform);881builder.addCapability(spv::Capability::GroupNonUniformBallot);882return spv::BuiltIn::SubgroupLeMask;883884case glslang::EbvSubgroupLtMask2:885builder.addCapability(spv::Capability::GroupNonUniform);886builder.addCapability(spv::Capability::GroupNonUniformBallot);887return spv::BuiltIn::SubgroupLtMask;888889case glslang::EbvBaryCoordNoPersp:890builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);891return spv::BuiltIn::BaryCoordNoPerspAMD;892893case glslang::EbvBaryCoordNoPerspCentroid:894builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);895return spv::BuiltIn::BaryCoordNoPerspCentroidAMD;896897case glslang::EbvBaryCoordNoPerspSample:898builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);899return spv::BuiltIn::BaryCoordNoPerspSampleAMD;900901case glslang::EbvBaryCoordSmooth:902builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);903return spv::BuiltIn::BaryCoordSmoothAMD;904905case 
glslang::EbvBaryCoordSmoothCentroid:906builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);907return spv::BuiltIn::BaryCoordSmoothCentroidAMD;908909case glslang::EbvBaryCoordSmoothSample:910builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);911return spv::BuiltIn::BaryCoordSmoothSampleAMD;912913case glslang::EbvBaryCoordPullModel:914builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);915return spv::BuiltIn::BaryCoordPullModelAMD;916917case glslang::EbvDeviceIndex:918builder.addIncorporatedExtension(spv::E_SPV_KHR_device_group, spv::Spv_1_3);919builder.addCapability(spv::Capability::DeviceGroup);920return spv::BuiltIn::DeviceIndex;921922case glslang::EbvViewIndex:923builder.addIncorporatedExtension(spv::E_SPV_KHR_multiview, spv::Spv_1_3);924builder.addCapability(spv::Capability::MultiView);925return spv::BuiltIn::ViewIndex;926927case glslang::EbvFragSizeEXT:928builder.addExtension(spv::E_SPV_EXT_fragment_invocation_density);929builder.addCapability(spv::Capability::FragmentDensityEXT);930return spv::BuiltIn::FragSizeEXT;931932case glslang::EbvFragInvocationCountEXT:933builder.addExtension(spv::E_SPV_EXT_fragment_invocation_density);934builder.addCapability(spv::Capability::FragmentDensityEXT);935return spv::BuiltIn::FragInvocationCountEXT;936937case glslang::EbvViewportMaskNV:938if (!memberDeclaration) {939builder.addExtension(spv::E_SPV_NV_viewport_array2);940builder.addCapability(spv::Capability::ShaderViewportMaskNV);941}942return spv::BuiltIn::ViewportMaskNV;943case glslang::EbvSecondaryPositionNV:944if (!memberDeclaration) {945builder.addExtension(spv::E_SPV_NV_stereo_view_rendering);946builder.addCapability(spv::Capability::ShaderStereoViewNV);947}948return spv::BuiltIn::SecondaryPositionNV;949case glslang::EbvSecondaryViewportMaskNV:950if (!memberDeclaration) {951builder.addExtension(spv::E_SPV_NV_stereo_view_rendering);952builder.addCapability(spv::Capability::ShaderStereoViewNV);953}954return 
spv::BuiltIn::SecondaryViewportMaskNV;955case glslang::EbvPositionPerViewNV:956if (!memberDeclaration) {957builder.addExtension(spv::E_SPV_NVX_multiview_per_view_attributes);958builder.addCapability(spv::Capability::PerViewAttributesNV);959}960return spv::BuiltIn::PositionPerViewNV;961case glslang::EbvViewportMaskPerViewNV:962if (!memberDeclaration) {963builder.addExtension(spv::E_SPV_NVX_multiview_per_view_attributes);964builder.addCapability(spv::Capability::PerViewAttributesNV);965}966return spv::BuiltIn::ViewportMaskPerViewNV;967case glslang::EbvFragFullyCoveredNV:968builder.addExtension(spv::E_SPV_EXT_fragment_fully_covered);969builder.addCapability(spv::Capability::FragmentFullyCoveredEXT);970return spv::BuiltIn::FullyCoveredEXT;971case glslang::EbvFragmentSizeNV:972builder.addExtension(spv::E_SPV_NV_shading_rate);973builder.addCapability(spv::Capability::ShadingRateNV);974return spv::BuiltIn::FragmentSizeNV;975case glslang::EbvInvocationsPerPixelNV:976builder.addExtension(spv::E_SPV_NV_shading_rate);977builder.addCapability(spv::Capability::ShadingRateNV);978return spv::BuiltIn::InvocationsPerPixelNV;979980// ray tracing981case glslang::EbvLaunchId:982return spv::BuiltIn::LaunchIdKHR;983case glslang::EbvLaunchSize:984return spv::BuiltIn::LaunchSizeKHR;985case glslang::EbvWorldRayOrigin:986return spv::BuiltIn::WorldRayOriginKHR;987case glslang::EbvWorldRayDirection:988return spv::BuiltIn::WorldRayDirectionKHR;989case glslang::EbvObjectRayOrigin:990return spv::BuiltIn::ObjectRayOriginKHR;991case glslang::EbvObjectRayDirection:992return spv::BuiltIn::ObjectRayDirectionKHR;993case glslang::EbvRayTmin:994return spv::BuiltIn::RayTminKHR;995case glslang::EbvRayTmax:996return spv::BuiltIn::RayTmaxKHR;997case glslang::EbvCullMask:998return spv::BuiltIn::CullMaskKHR;999case glslang::EbvPositionFetch:1000return spv::BuiltIn::HitTriangleVertexPositionsKHR;1001case glslang::EbvInstanceCustomIndex:1002return spv::BuiltIn::InstanceCustomIndexKHR;1003case 
glslang::EbvHitKind:1004return spv::BuiltIn::HitKindKHR;1005case glslang::EbvObjectToWorld:1006case glslang::EbvObjectToWorld3x4:1007return spv::BuiltIn::ObjectToWorldKHR;1008case glslang::EbvWorldToObject:1009case glslang::EbvWorldToObject3x4:1010return spv::BuiltIn::WorldToObjectKHR;1011case glslang::EbvIncomingRayFlags:1012return spv::BuiltIn::IncomingRayFlagsKHR;1013case glslang::EbvGeometryIndex:1014return spv::BuiltIn::RayGeometryIndexKHR;1015case glslang::EbvCurrentRayTimeNV:1016builder.addExtension(spv::E_SPV_NV_ray_tracing_motion_blur);1017builder.addCapability(spv::Capability::RayTracingMotionBlurNV);1018return spv::BuiltIn::CurrentRayTimeNV;1019case glslang::EbvMicroTrianglePositionNV:1020builder.addCapability(spv::Capability::RayTracingDisplacementMicromapNV);1021builder.addExtension("SPV_NV_displacement_micromap");1022return spv::BuiltIn::HitMicroTriangleVertexPositionsNV;1023case glslang::EbvMicroTriangleBaryNV:1024builder.addCapability(spv::Capability::RayTracingDisplacementMicromapNV);1025builder.addExtension("SPV_NV_displacement_micromap");1026return spv::BuiltIn::HitMicroTriangleVertexBarycentricsNV;1027case glslang::EbvHitKindFrontFacingMicroTriangleNV:1028builder.addCapability(spv::Capability::RayTracingDisplacementMicromapNV);1029builder.addExtension("SPV_NV_displacement_micromap");1030return spv::BuiltIn::HitKindFrontFacingMicroTriangleNV;1031case glslang::EbvHitKindBackFacingMicroTriangleNV:1032builder.addCapability(spv::Capability::RayTracingDisplacementMicromapNV);1033builder.addExtension("SPV_NV_displacement_micromap");1034return spv::BuiltIn::HitKindBackFacingMicroTriangleNV;1035case glslang::EbvClusterIDNV:1036builder.addCapability(spv::Capability::RayTracingClusterAccelerationStructureNV);1037builder.addExtension("SPV_NV_cluster_acceleration_structure");1038return spv::BuiltIn::ClusterIDNV;1039case 
glslang::EbvHitIsSphereNV:1040builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);1041builder.addExtension("SPV_NV_linear_swept_spheres");1042return spv::BuiltIn::HitIsSphereNV;1043case glslang::EbvHitIsLSSNV:1044builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);1045builder.addExtension("SPV_NV_linear_swept_spheres");1046return spv::BuiltIn::HitIsLSSNV;1047case glslang::EbvHitSpherePositionNV:1048builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);1049builder.addExtension("SPV_NV_linear_swept_spheres");1050return spv::BuiltIn::HitSpherePositionNV;1051case glslang::EbvHitSphereRadiusNV:1052builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);1053builder.addExtension("SPV_NV_linear_swept_spheres");1054return spv::BuiltIn::HitSphereRadiusNV;1055case glslang::EbvHitLSSPositionsNV:1056builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);1057builder.addExtension("SPV_NV_linear_swept_spheres");1058return spv::BuiltIn::HitLSSPositionsNV;1059case glslang::EbvHitLSSRadiiNV:1060builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);1061builder.addExtension("SPV_NV_linear_swept_spheres");1062return spv::BuiltIn::HitLSSRadiiNV;10631064// barycentrics1065case glslang::EbvBaryCoordNV:1066builder.addExtension(spv::E_SPV_NV_fragment_shader_barycentric);1067builder.addCapability(spv::Capability::FragmentBarycentricNV);1068return spv::BuiltIn::BaryCoordNV;1069case glslang::EbvBaryCoordNoPerspNV:1070builder.addExtension(spv::E_SPV_NV_fragment_shader_barycentric);1071builder.addCapability(spv::Capability::FragmentBarycentricNV);1072return spv::BuiltIn::BaryCoordNoPerspNV;10731074case glslang::EbvBaryCoordEXT:1075builder.addExtension(spv::E_SPV_KHR_fragment_shader_barycentric);1076builder.addCapability(spv::Capability::FragmentBarycentricKHR);1077return spv::BuiltIn::BaryCoordKHR;1078case 
glslang::EbvBaryCoordNoPerspEXT:1079builder.addExtension(spv::E_SPV_KHR_fragment_shader_barycentric);1080builder.addCapability(spv::Capability::FragmentBarycentricKHR);1081return spv::BuiltIn::BaryCoordNoPerspKHR;10821083// mesh shaders1084case glslang::EbvTaskCountNV:1085return spv::BuiltIn::TaskCountNV;1086case glslang::EbvPrimitiveCountNV:1087return spv::BuiltIn::PrimitiveCountNV;1088case glslang::EbvPrimitiveIndicesNV:1089return spv::BuiltIn::PrimitiveIndicesNV;1090case glslang::EbvClipDistancePerViewNV:1091return spv::BuiltIn::ClipDistancePerViewNV;1092case glslang::EbvCullDistancePerViewNV:1093return spv::BuiltIn::CullDistancePerViewNV;1094case glslang::EbvLayerPerViewNV:1095return spv::BuiltIn::LayerPerViewNV;1096case glslang::EbvMeshViewCountNV:1097return spv::BuiltIn::MeshViewCountNV;1098case glslang::EbvMeshViewIndicesNV:1099return spv::BuiltIn::MeshViewIndicesNV;11001101// SPV_EXT_mesh_shader1102case glslang::EbvPrimitivePointIndicesEXT:1103return spv::BuiltIn::PrimitivePointIndicesEXT;1104case glslang::EbvPrimitiveLineIndicesEXT:1105return spv::BuiltIn::PrimitiveLineIndicesEXT;1106case glslang::EbvPrimitiveTriangleIndicesEXT:1107return spv::BuiltIn::PrimitiveTriangleIndicesEXT;1108case glslang::EbvCullPrimitiveEXT:1109return spv::BuiltIn::CullPrimitiveEXT;11101111// sm builtins1112case glslang::EbvWarpsPerSM:1113builder.addExtension(spv::E_SPV_NV_shader_sm_builtins);1114builder.addCapability(spv::Capability::ShaderSMBuiltinsNV);1115return spv::BuiltIn::WarpsPerSMNV;1116case glslang::EbvSMCount:1117builder.addExtension(spv::E_SPV_NV_shader_sm_builtins);1118builder.addCapability(spv::Capability::ShaderSMBuiltinsNV);1119return spv::BuiltIn::SMCountNV;1120case glslang::EbvWarpID:1121builder.addExtension(spv::E_SPV_NV_shader_sm_builtins);1122builder.addCapability(spv::Capability::ShaderSMBuiltinsNV);1123return spv::BuiltIn::WarpIDNV;1124case 
glslang::EbvSMID:1125builder.addExtension(spv::E_SPV_NV_shader_sm_builtins);1126builder.addCapability(spv::Capability::ShaderSMBuiltinsNV);1127return spv::BuiltIn::SMIDNV;11281129// ARM builtins1130case glslang::EbvCoreCountARM:1131builder.addExtension(spv::E_SPV_ARM_core_builtins);1132builder.addCapability(spv::Capability::CoreBuiltinsARM);1133return spv::BuiltIn::CoreCountARM;1134case glslang::EbvCoreIDARM:1135builder.addExtension(spv::E_SPV_ARM_core_builtins);1136builder.addCapability(spv::Capability::CoreBuiltinsARM);1137return spv::BuiltIn::CoreIDARM;1138case glslang::EbvCoreMaxIDARM:1139builder.addExtension(spv::E_SPV_ARM_core_builtins);1140builder.addCapability(spv::Capability::CoreBuiltinsARM);1141return spv::BuiltIn::CoreMaxIDARM;1142case glslang::EbvWarpIDARM:1143builder.addExtension(spv::E_SPV_ARM_core_builtins);1144builder.addCapability(spv::Capability::CoreBuiltinsARM);1145return spv::BuiltIn::WarpIDARM;1146case glslang::EbvWarpMaxIDARM:1147builder.addExtension(spv::E_SPV_ARM_core_builtins);1148builder.addCapability(spv::Capability::CoreBuiltinsARM);1149return spv::BuiltIn::WarpMaxIDARM;11501151// QCOM builtins1152case glslang::EbvTileOffsetQCOM:1153builder.addExtension(spv::E_SPV_QCOM_tile_shading);1154return spv::BuiltIn::TileOffsetQCOM;1155case glslang::EbvTileDimensionQCOM:1156builder.addExtension(spv::E_SPV_QCOM_tile_shading);1157return spv::BuiltIn::TileDimensionQCOM;1158case glslang::EbvTileApronSizeQCOM:1159builder.addExtension(spv::E_SPV_QCOM_tile_shading);1160return spv::BuiltIn::TileApronSizeQCOM;11611162default:1163return spv::BuiltIn::Max;1164}1165}11661167// Translate glslang image layout format to SPIR-V image format.1168spv::ImageFormat TGlslangToSpvTraverser::TranslateImageFormat(const glslang::TType& type)1169{1170assert(type.getBasicType() == glslang::EbtSampler);11711172// Check for capabilities1173switch (type.getQualifier().getFormat()) {1174case glslang::ElfRg32f:1175case glslang::ElfRg16f:1176case 
glslang::ElfR11fG11fB10f:1177case glslang::ElfR16f:1178case glslang::ElfRgba16:1179case glslang::ElfRgb10A2:1180case glslang::ElfRg16:1181case glslang::ElfRg8:1182case glslang::ElfR16:1183case glslang::ElfR8:1184case glslang::ElfRgba16Snorm:1185case glslang::ElfRg16Snorm:1186case glslang::ElfRg8Snorm:1187case glslang::ElfR16Snorm:1188case glslang::ElfR8Snorm:11891190case glslang::ElfRg32i:1191case glslang::ElfRg16i:1192case glslang::ElfRg8i:1193case glslang::ElfR16i:1194case glslang::ElfR8i:11951196case glslang::ElfRgb10a2ui:1197case glslang::ElfRg32ui:1198case glslang::ElfRg16ui:1199case glslang::ElfRg8ui:1200case glslang::ElfR16ui:1201case glslang::ElfR8ui:1202builder.addCapability(spv::Capability::StorageImageExtendedFormats);1203break;12041205case glslang::ElfR64ui:1206case glslang::ElfR64i:1207builder.addExtension(spv::E_SPV_EXT_shader_image_int64);1208builder.addCapability(spv::Capability::Int64ImageEXT);1209break;1210default:1211break;1212}12131214// do the translation1215switch (type.getQualifier().getFormat()) {1216case glslang::ElfNone: return spv::ImageFormat::Unknown;1217case glslang::ElfRgba32f: return spv::ImageFormat::Rgba32f;1218case glslang::ElfRgba16f: return spv::ImageFormat::Rgba16f;1219case glslang::ElfR32f: return spv::ImageFormat::R32f;1220case glslang::ElfRgba8: return spv::ImageFormat::Rgba8;1221case glslang::ElfRgba8Snorm: return spv::ImageFormat::Rgba8Snorm;1222case glslang::ElfRg32f: return spv::ImageFormat::Rg32f;1223case glslang::ElfRg16f: return spv::ImageFormat::Rg16f;1224case glslang::ElfR11fG11fB10f: return spv::ImageFormat::R11fG11fB10f;1225case glslang::ElfR16f: return spv::ImageFormat::R16f;1226case glslang::ElfRgba16: return spv::ImageFormat::Rgba16;1227case glslang::ElfRgb10A2: return spv::ImageFormat::Rgb10A2;1228case glslang::ElfRg16: return spv::ImageFormat::Rg16;1229case glslang::ElfRg8: return spv::ImageFormat::Rg8;1230case glslang::ElfR16: return spv::ImageFormat::R16;1231case glslang::ElfR8: return 
spv::ImageFormat::R8;1232case glslang::ElfRgba16Snorm: return spv::ImageFormat::Rgba16Snorm;1233case glslang::ElfRg16Snorm: return spv::ImageFormat::Rg16Snorm;1234case glslang::ElfRg8Snorm: return spv::ImageFormat::Rg8Snorm;1235case glslang::ElfR16Snorm: return spv::ImageFormat::R16Snorm;1236case glslang::ElfR8Snorm: return spv::ImageFormat::R8Snorm;1237case glslang::ElfRgba32i: return spv::ImageFormat::Rgba32i;1238case glslang::ElfRgba16i: return spv::ImageFormat::Rgba16i;1239case glslang::ElfRgba8i: return spv::ImageFormat::Rgba8i;1240case glslang::ElfR32i: return spv::ImageFormat::R32i;1241case glslang::ElfRg32i: return spv::ImageFormat::Rg32i;1242case glslang::ElfRg16i: return spv::ImageFormat::Rg16i;1243case glslang::ElfRg8i: return spv::ImageFormat::Rg8i;1244case glslang::ElfR16i: return spv::ImageFormat::R16i;1245case glslang::ElfR8i: return spv::ImageFormat::R8i;1246case glslang::ElfRgba32ui: return spv::ImageFormat::Rgba32ui;1247case glslang::ElfRgba16ui: return spv::ImageFormat::Rgba16ui;1248case glslang::ElfRgba8ui: return spv::ImageFormat::Rgba8ui;1249case glslang::ElfR32ui: return spv::ImageFormat::R32ui;1250case glslang::ElfRg32ui: return spv::ImageFormat::Rg32ui;1251case glslang::ElfRg16ui: return spv::ImageFormat::Rg16ui;1252case glslang::ElfRgb10a2ui: return spv::ImageFormat::Rgb10a2ui;1253case glslang::ElfRg8ui: return spv::ImageFormat::Rg8ui;1254case glslang::ElfR16ui: return spv::ImageFormat::R16ui;1255case glslang::ElfR8ui: return spv::ImageFormat::R8ui;1256case glslang::ElfR64ui: return spv::ImageFormat::R64ui;1257case glslang::ElfR64i: return spv::ImageFormat::R64i;1258default: return spv::ImageFormat::Max;1259}1260}12611262spv::SelectionControlMask TGlslangToSpvTraverser::TranslateSelectionControl(1263const glslang::TIntermSelection& selectionNode) const1264{1265if (selectionNode.getFlatten())1266return spv::SelectionControlMask::Flatten;1267if (selectionNode.getDontFlatten())1268return spv::SelectionControlMask::DontFlatten;1269return 
spv::SelectionControlMask::MaskNone;1270}12711272spv::SelectionControlMask TGlslangToSpvTraverser::TranslateSwitchControl(const glslang::TIntermSwitch& switchNode)1273const1274{1275if (switchNode.getFlatten())1276return spv::SelectionControlMask::Flatten;1277if (switchNode.getDontFlatten())1278return spv::SelectionControlMask::DontFlatten;1279return spv::SelectionControlMask::MaskNone;1280}12811282// return a non-0 dependency if the dependency argument must be set1283spv::LoopControlMask TGlslangToSpvTraverser::TranslateLoopControl(const glslang::TIntermLoop& loopNode,1284std::vector<unsigned int>& operands) const1285{1286spv::LoopControlMask control = spv::LoopControlMask::MaskNone;12871288if (loopNode.getDontUnroll())1289control = control | spv::LoopControlMask::DontUnroll;1290if (loopNode.getUnroll())1291control = control | spv::LoopControlMask::Unroll;1292if (unsigned(loopNode.getLoopDependency()) == glslang::TIntermLoop::dependencyInfinite)1293control = control | spv::LoopControlMask::DependencyInfinite;1294else if (loopNode.getLoopDependency() > 0) {1295control = control | spv::LoopControlMask::DependencyLength;1296operands.push_back((unsigned int)loopNode.getLoopDependency());1297}1298if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4) {1299if (loopNode.getMinIterations() > 0) {1300control = control | spv::LoopControlMask::MinIterations;1301operands.push_back(loopNode.getMinIterations());1302}1303if (loopNode.getMaxIterations() < glslang::TIntermLoop::iterationsInfinite) {1304control = control | spv::LoopControlMask::MaxIterations;1305operands.push_back(loopNode.getMaxIterations());1306}1307if (loopNode.getIterationMultiple() > 1) {1308control = control | spv::LoopControlMask::IterationMultiple;1309operands.push_back(loopNode.getIterationMultiple());1310}1311if (loopNode.getPeelCount() > 0) {1312control = control | spv::LoopControlMask::PeelCount;1313operands.push_back(loopNode.getPeelCount());1314}1315if (loopNode.getPartialCount() > 0) 
{1316control = control | spv::LoopControlMask::PartialCount;1317operands.push_back(loopNode.getPartialCount());1318}1319}13201321return control;1322}13231324// Translate glslang type to SPIR-V storage class.1325spv::StorageClass TGlslangToSpvTraverser::TranslateStorageClass(const glslang::TType& type)1326{1327if (type.getBasicType() == glslang::EbtRayQuery || type.getBasicType() == glslang::EbtHitObjectNV1328|| type.getBasicType() == glslang::EbtHitObjectEXT)1329return spv::StorageClass::Private;1330if (type.getQualifier().isSpirvByReference()) {1331if (type.getQualifier().isParamInput() || type.getQualifier().isParamOutput())1332return spv::StorageClass::Function;1333}1334if (type.getQualifier().isPipeInput())1335return spv::StorageClass::Input;1336if (type.getQualifier().isPipeOutput())1337return spv::StorageClass::Output;1338if (type.getQualifier().storage == glslang::EvqTileImageEXT || type.isAttachmentEXT()) {1339builder.addExtension(spv::E_SPV_EXT_shader_tile_image);1340builder.addCapability(spv::Capability::TileImageColorReadAccessEXT);1341return spv::StorageClass::TileImageEXT;1342}13431344if (type.getQualifier().isTileAttachmentQCOM()) {1345builder.addExtension(spv::E_SPV_QCOM_tile_shading);1346builder.addCapability(spv::Capability::TileShadingQCOM);1347return spv::StorageClass::TileAttachmentQCOM;1348}13491350if (glslangIntermediate->getSource() != glslang::EShSourceHlsl ||1351type.getQualifier().storage == glslang::EvqUniform) {1352if (type.isAtomic())1353return spv::StorageClass::AtomicCounter;1354if (type.containsOpaque() && !glslangIntermediate->getBindlessMode())1355return spv::StorageClass::UniformConstant;1356}13571358if (type.getQualifier().isUniformOrBuffer() &&1359type.getQualifier().isShaderRecord()) {1360return spv::StorageClass::ShaderRecordBufferKHR;1361}13621363if (glslangIntermediate->usingStorageBuffer() && type.getQualifier().storage == glslang::EvqBuffer) {1364builder.addIncorporatedExtension(spv::E_SPV_KHR_storage_buffer_storage_class, 
spv::Spv_1_3);1365return spv::StorageClass::StorageBuffer;1366}13671368if (type.getQualifier().isUniformOrBuffer()) {1369if (type.getQualifier().isPushConstant())1370return spv::StorageClass::PushConstant;1371if (type.getBasicType() == glslang::EbtBlock)1372return spv::StorageClass::Uniform;1373return spv::StorageClass::UniformConstant;1374}13751376if (type.getQualifier().storage == glslang::EvqShared && type.getBasicType() == glslang::EbtBlock) {1377builder.addExtension(spv::E_SPV_KHR_workgroup_memory_explicit_layout);1378builder.addCapability(spv::Capability::WorkgroupMemoryExplicitLayoutKHR);1379return spv::StorageClass::Workgroup;1380}13811382switch (type.getQualifier().storage) {1383case glslang::EvqGlobal: return spv::StorageClass::Private;1384case glslang::EvqConstReadOnly: return spv::StorageClass::Function;1385case glslang::EvqTemporary: return spv::StorageClass::Function;1386case glslang::EvqShared: return spv::StorageClass::Workgroup;1387case glslang::EvqPayload: return spv::StorageClass::RayPayloadKHR;1388case glslang::EvqPayloadIn: return spv::StorageClass::IncomingRayPayloadKHR;1389case glslang::EvqHitAttr: return spv::StorageClass::HitAttributeKHR;1390case glslang::EvqCallableData: return spv::StorageClass::CallableDataKHR;1391case glslang::EvqCallableDataIn: return spv::StorageClass::IncomingCallableDataKHR;1392case glslang::EvqtaskPayloadSharedEXT : return spv::StorageClass::TaskPayloadWorkgroupEXT;1393case glslang::EvqHitObjectAttrNV: return spv::StorageClass::HitObjectAttributeNV;1394case glslang::EvqHitObjectAttrEXT: return spv::StorageClass::HitObjectAttributeEXT;1395case glslang::EvqSpirvStorageClass: return static_cast<spv::StorageClass>(type.getQualifier().spirvStorageClass);1396default:1397assert(0);1398break;1399}14001401return spv::StorageClass::Function;1402}14031404// Translate glslang constants to SPIR-V literals1405void TGlslangToSpvTraverser::TranslateLiterals(const glslang::TVector<const glslang::TIntermConstantUnion*>& 
constants,1406std::vector<unsigned>& literals) const1407{1408for (auto constant : constants) {1409if (constant->getBasicType() == glslang::EbtFloat) {1410float floatValue = static_cast<float>(constant->getConstArray()[0].getDConst());1411unsigned literal;1412static_assert(sizeof(literal) == sizeof(floatValue), "sizeof(unsigned) != sizeof(float)");1413memcpy(&literal, &floatValue, sizeof(literal));1414literals.push_back(literal);1415} else if (constant->getBasicType() == glslang::EbtInt) {1416unsigned literal = constant->getConstArray()[0].getIConst();1417literals.push_back(literal);1418} else if (constant->getBasicType() == glslang::EbtUint) {1419unsigned literal = constant->getConstArray()[0].getUConst();1420literals.push_back(literal);1421} else if (constant->getBasicType() == glslang::EbtBool) {1422unsigned literal = constant->getConstArray()[0].getBConst();1423literals.push_back(literal);1424} else if (constant->getBasicType() == glslang::EbtString) {1425auto str = constant->getConstArray()[0].getSConst()->c_str();1426unsigned literal = 0;1427char* literalPtr = reinterpret_cast<char*>(&literal);1428unsigned charCount = 0;1429char ch = 0;1430do {1431ch = *(str++);1432*(literalPtr++) = ch;1433++charCount;1434if (charCount == 4) {1435literals.push_back(literal);1436literalPtr = reinterpret_cast<char*>(&literal);1437charCount = 0;1438}1439} while (ch != 0);14401441// Partial literal is padded with 01442if (charCount > 0) {1443for (; charCount < 4; ++charCount)1444*(literalPtr++) = 0;1445literals.push_back(literal);1446}1447} else1448assert(0); // Unexpected type1449}1450}14511452// Add capabilities pertaining to how an array is indexed.1453void TGlslangToSpvTraverser::addIndirectionIndexCapabilities(const glslang::TType& baseType,1454const glslang::TType& indexType)1455{1456if (indexType.getQualifier().isNonUniform()) {1457// deal with an asserted non-uniform index1458// SPV_EXT_descriptor_indexing already added in TranslateNonUniformDecoration1459if 
(baseType.getBasicType() == glslang::EbtSampler) {1460if (baseType.getQualifier().hasAttachment())1461builder.addCapability(spv::Capability::InputAttachmentArrayNonUniformIndexingEXT);1462else if (baseType.isImage() && baseType.getSampler().isBuffer())1463builder.addCapability(spv::Capability::StorageTexelBufferArrayNonUniformIndexingEXT);1464else if (baseType.isTexture() && baseType.getSampler().isBuffer())1465builder.addCapability(spv::Capability::UniformTexelBufferArrayNonUniformIndexingEXT);1466else if (baseType.isImage())1467builder.addCapability(spv::Capability::StorageImageArrayNonUniformIndexingEXT);1468else if (baseType.isTexture())1469builder.addCapability(spv::Capability::SampledImageArrayNonUniformIndexingEXT);1470} else if (baseType.getBasicType() == glslang::EbtBlock) {1471if (baseType.getQualifier().storage == glslang::EvqBuffer)1472builder.addCapability(spv::Capability::StorageBufferArrayNonUniformIndexingEXT);1473else if (baseType.getQualifier().storage == glslang::EvqUniform)1474builder.addCapability(spv::Capability::UniformBufferArrayNonUniformIndexingEXT);1475}1476} else {1477// assume a dynamically uniform index1478if (baseType.getBasicType() == glslang::EbtSampler) {1479if (baseType.getQualifier().hasAttachment()) {1480builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);1481builder.addCapability(spv::Capability::InputAttachmentArrayDynamicIndexingEXT);1482} else if (baseType.isImage() && baseType.getSampler().isBuffer()) {1483builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);1484builder.addCapability(spv::Capability::StorageTexelBufferArrayDynamicIndexingEXT);1485} else if (baseType.isTexture() && baseType.getSampler().isBuffer()) {1486builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);1487builder.addCapability(spv::Capability::UniformTexelBufferArrayDynamicIndexingEXT);1488}1489}1490}1491}14921493// Return whether or not the given type is something that should be 
tied to a1494// descriptor set.1495bool IsDescriptorResource(const glslang::TType& type)1496{1497// uniform and buffer blocks are included, unless it is a push_constant1498if (type.getBasicType() == glslang::EbtBlock)1499return type.getQualifier().isUniformOrBuffer() &&1500! type.getQualifier().isShaderRecord() &&1501! type.getQualifier().isPushConstant();15021503// non block...1504// basically samplerXXX/subpass/sampler/texture are all included1505// if they are the global-scope-class, not the function parameter1506// (or local, if they ever exist) class.1507if (type.getBasicType() == glslang::EbtSampler ||1508type.getBasicType() == glslang::EbtAccStruct)1509return type.getQualifier().isUniformOrBuffer();15101511// Tensors are tied to a descriptor.1512if (type.isTensorARM())1513return true;15141515// None of the above.1516return false;1517}15181519void InheritQualifiers(glslang::TQualifier& child, const glslang::TQualifier& parent)1520{1521if (child.layoutMatrix == glslang::ElmNone)1522child.layoutMatrix = parent.layoutMatrix;15231524if (parent.invariant)1525child.invariant = true;1526if (parent.flat)1527child.flat = true;1528if (parent.centroid)1529child.centroid = true;1530if (parent.nopersp)1531child.nopersp = true;1532if (parent.explicitInterp)1533child.explicitInterp = true;1534if (parent.perPrimitiveNV)1535child.perPrimitiveNV = true;1536if (parent.perViewNV)1537child.perViewNV = true;1538if (parent.perTaskNV)1539child.perTaskNV = true;1540if (parent.storage == glslang::EvqtaskPayloadSharedEXT)1541child.storage = glslang::EvqtaskPayloadSharedEXT;1542if (parent.patch)1543child.patch = true;1544if (parent.sample)1545child.sample = true;1546if (parent.coherent)1547child.coherent = true;1548if (parent.devicecoherent)1549child.devicecoherent = true;1550if (parent.queuefamilycoherent)1551child.queuefamilycoherent = true;1552if (parent.workgroupcoherent)1553child.workgroupcoherent = true;1554if (parent.subgroupcoherent)1555child.subgroupcoherent = true;1556if 
(parent.shadercallcoherent)1557child.shadercallcoherent = true;1558if (parent.nonprivate)1559child.nonprivate = true;1560if (parent.volatil)1561child.volatil = true;1562if (parent.nontemporal)1563child.nontemporal = true;1564if (parent.restrict)1565child.restrict = true;1566if (parent.readonly)1567child.readonly = true;1568if (parent.writeonly)1569child.writeonly = true;1570if (parent.nonUniform)1571child.nonUniform = true;1572}15731574bool HasNonLayoutQualifiers(const glslang::TType& type, const glslang::TQualifier& qualifier)1575{1576// This should list qualifiers that simultaneous satisfy:1577// - struct members might inherit from a struct declaration1578// (note that non-block structs don't explicitly inherit,1579// only implicitly, meaning no decoration involved)1580// - affect decorations on the struct members1581// (note smooth does not, and expecting something like volatile1582// to effect the whole object)1583// - are not part of the offset/st430/etc or row/column-major layout1584return qualifier.invariant || (qualifier.hasLocation() && type.getBasicType() == glslang::EbtBlock);1585}15861587//1588// Implement the TGlslangToSpvTraverser class.1589//15901591TGlslangToSpvTraverser::TGlslangToSpvTraverser(unsigned int spvVersion,1592const glslang::TIntermediate* glslangIntermediate,1593spv::SpvBuildLogger* buildLogger, glslang::SpvOptions& options) :1594TIntermTraverser(true, false, true),1595options(options),1596shaderEntry(nullptr), currentFunction(nullptr),1597sequenceDepth(0), logger(buildLogger),1598builder(spvVersion, (glslang::GetKhronosToolId() << 16) | glslang::GetSpirvGeneratorVersion(), logger),1599inEntryPoint(false), entryPointTerminated(false), linkageOnly(false),1600glslangIntermediate(glslangIntermediate),1601nanMinMaxClamp(glslangIntermediate->getNanMinMaxClamp()),1602nonSemanticDebugPrintf(0),1603taskPayloadID(0)1604{1605bool isMeshShaderExt = (glslangIntermediate->getRequestedExtensions().find(glslang::E_GL_EXT_mesh_shader) 
!=1606glslangIntermediate->getRequestedExtensions().end());1607spv::ExecutionModel executionModel = TranslateExecutionModel(glslangIntermediate->getStage(), isMeshShaderExt);16081609builder.clearAccessChain();1610builder.setSource(TranslateSourceLanguage(glslangIntermediate->getSource(), glslangIntermediate->getProfile()),1611glslangIntermediate->getVersion());16121613if (options.emitNonSemanticShaderDebugSource)1614this->options.emitNonSemanticShaderDebugInfo = true;1615if (options.emitNonSemanticShaderDebugInfo)1616this->options.generateDebugInfo = true;16171618if (this->options.generateDebugInfo) {1619if (this->options.emitNonSemanticShaderDebugInfo) {1620builder.setEmitNonSemanticShaderDebugInfo(this->options.emitNonSemanticShaderDebugSource);1621}1622else {1623builder.setEmitSpirvDebugInfo();1624}1625builder.setDebugMainSourceFile(glslangIntermediate->getSourceFile());16261627// Set the source shader's text. If for SPV version 1.0, include1628// a preamble in comments stating the OpModuleProcessed instructions.1629// Otherwise, emit those as actual instructions.1630std::string text;1631const std::vector<std::string>& processes = glslangIntermediate->getProcesses();1632for (int p = 0; p < (int)processes.size(); ++p) {1633if (glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_1) {1634text.append("// OpModuleProcessed ");1635text.append(processes[p]);1636text.append("\n");1637} else1638builder.addModuleProcessed(processes[p]);1639}1640if (glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_1 && (int)processes.size() > 0)1641text.append("#line 1\n");1642text.append(glslangIntermediate->getSourceText());1643builder.setSourceText(text);1644// Pass name and text for all included files1645const std::map<std::string, std::string>& include_txt = glslangIntermediate->getIncludeText();1646for (auto iItr = include_txt.begin(); iItr != include_txt.end(); ++iItr)1647builder.addInclude(iItr->first, 
iItr->second);1648}16491650builder.setUseReplicatedComposites(glslangIntermediate->usingReplicatedComposites());16511652stdBuiltins = builder.import("GLSL.std.450");16531654spv::AddressingModel addressingModel = spv::AddressingModel::Logical;1655spv::MemoryModel memoryModel = spv::MemoryModel::GLSL450;16561657if (glslangIntermediate->usingPhysicalStorageBuffer()) {1658addressingModel = spv::AddressingModel::PhysicalStorageBuffer64EXT;1659builder.addIncorporatedExtension(spv::E_SPV_KHR_physical_storage_buffer, spv::Spv_1_5);1660builder.addCapability(spv::Capability::PhysicalStorageBufferAddressesEXT);1661}1662if (glslangIntermediate->usingVulkanMemoryModel()) {1663memoryModel = spv::MemoryModel::VulkanKHR;1664builder.addCapability(spv::Capability::VulkanMemoryModelKHR);1665builder.addIncorporatedExtension(spv::E_SPV_KHR_vulkan_memory_model, spv::Spv_1_5);1666}1667builder.setMemoryModel(addressingModel, memoryModel);16681669if (glslangIntermediate->usingVariablePointers()) {1670builder.addCapability(spv::Capability::VariablePointers);1671}16721673// If not linking, there is no entry point1674if (!options.compileOnly) {1675shaderEntry = builder.makeEntryPoint(glslangIntermediate->getEntryPointName().c_str());1676entryPoint =1677builder.addEntryPoint(executionModel, shaderEntry, glslangIntermediate->getEntryPointName().c_str());1678}16791680// Add the source extensions1681const auto& sourceExtensions = glslangIntermediate->getRequestedExtensions();1682for (auto it = sourceExtensions.begin(); it != sourceExtensions.end(); ++it)1683builder.addSourceExtension(it->c_str());16841685// Add the top-level modes for this shader.16861687if (glslangIntermediate->getXfbMode()) {1688builder.addCapability(spv::Capability::TransformFeedback);1689builder.addExecutionMode(shaderEntry, spv::ExecutionMode::Xfb);1690}16911692if (glslangIntermediate->getLayoutPrimitiveCulling()) {1693builder.addCapability(spv::Capability::RayTraversalPrimitiveCullingKHR);1694}16951696if 
(glslangIntermediate->getSubgroupUniformControlFlow()) {1697builder.addExtension(spv::E_SPV_KHR_subgroup_uniform_control_flow);1698builder.addExecutionMode(shaderEntry, spv::ExecutionMode::SubgroupUniformControlFlowKHR);1699}1700if (glslangIntermediate->getMaximallyReconverges()) {1701builder.addExtension(spv::E_SPV_KHR_maximal_reconvergence);1702builder.addExecutionMode(shaderEntry, spv::ExecutionMode::MaximallyReconvergesKHR);1703}17041705if (glslangIntermediate->getQuadDerivMode())1706{1707builder.addCapability(spv::Capability::QuadControlKHR);1708builder.addExtension(spv::E_SPV_KHR_quad_control);1709builder.addExecutionMode(shaderEntry, spv::ExecutionMode::QuadDerivativesKHR);1710}17111712if (glslangIntermediate->getReqFullQuadsMode())1713{1714builder.addCapability(spv::Capability::QuadControlKHR);1715builder.addExtension(spv::E_SPV_KHR_quad_control);1716builder.addExecutionMode(shaderEntry, spv::ExecutionMode::RequireFullQuadsKHR);1717}17181719if (glslangIntermediate->usingShader64BitIndexing())1720{1721builder.addCapability(spv::Capability::Shader64BitIndexingEXT);1722builder.addExtension(spv::E_SPV_EXT_shader_64bit_indexing);1723builder.addExecutionMode(shaderEntry, spv::ExecutionMode::Shader64BitIndexingEXT);1724}17251726spv::ExecutionMode mode;1727switch (glslangIntermediate->getStage()) {1728case EShLangVertex:1729builder.addCapability(spv::Capability::Shader);1730break;17311732case EShLangFragment:1733builder.addCapability(spv::Capability::Shader);1734if (glslangIntermediate->getPixelCenterInteger())1735builder.addExecutionMode(shaderEntry, spv::ExecutionMode::PixelCenterInteger);17361737if (glslangIntermediate->getOriginUpperLeft())1738builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OriginUpperLeft);1739else1740builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OriginLowerLeft);17411742if (glslangIntermediate->getEarlyFragmentTests())1743builder.addExecutionMode(shaderEntry, spv::ExecutionMode::EarlyFragmentTests);17441745if 
(glslangIntermediate->getEarlyAndLateFragmentTestsAMD())1746{1747builder.addExecutionMode(shaderEntry, spv::ExecutionMode::EarlyAndLateFragmentTestsAMD);1748builder.addExtension(spv::E_SPV_AMD_shader_early_and_late_fragment_tests);1749}17501751if (glslangIntermediate->getPostDepthCoverage()) {1752builder.addCapability(spv::Capability::SampleMaskPostDepthCoverage);1753builder.addExecutionMode(shaderEntry, spv::ExecutionMode::PostDepthCoverage);1754builder.addExtension(spv::E_SPV_KHR_post_depth_coverage);1755}17561757if (glslangIntermediate->getNonCoherentColorAttachmentReadEXT()) {1758builder.addCapability(spv::Capability::TileImageColorReadAccessEXT);1759builder.addExecutionMode(shaderEntry, spv::ExecutionMode::NonCoherentColorAttachmentReadEXT);1760builder.addExtension(spv::E_SPV_EXT_shader_tile_image);1761}17621763if (glslangIntermediate->getNonCoherentDepthAttachmentReadEXT()) {1764builder.addCapability(spv::Capability::TileImageDepthReadAccessEXT);1765builder.addExecutionMode(shaderEntry, spv::ExecutionMode::NonCoherentDepthAttachmentReadEXT);1766builder.addExtension(spv::E_SPV_EXT_shader_tile_image);1767}17681769if (glslangIntermediate->getNonCoherentStencilAttachmentReadEXT()) {1770builder.addCapability(spv::Capability::TileImageStencilReadAccessEXT);1771builder.addExecutionMode(shaderEntry, spv::ExecutionMode::NonCoherentStencilAttachmentReadEXT);1772builder.addExtension(spv::E_SPV_EXT_shader_tile_image);1773}17741775if (glslangIntermediate->getNonCoherentTileAttachmentReadQCOM()) {1776builder.addCapability(spv::Capability::TileShadingQCOM);1777builder.addExecutionMode(shaderEntry, spv::ExecutionMode::NonCoherentTileAttachmentReadQCOM);1778builder.addExtension(spv::E_SPV_QCOM_tile_shading);1779}17801781if (glslangIntermediate->isDepthReplacing())1782builder.addExecutionMode(shaderEntry, spv::ExecutionMode::DepthReplacing);17831784if (glslangIntermediate->isStencilReplacing())1785builder.addExecutionMode(shaderEntry, 
spv::ExecutionMode::StencilRefReplacingEXT);17861787switch(glslangIntermediate->getDepth()) {1788case glslang::EldGreater: mode = spv::ExecutionMode::DepthGreater; break;1789case glslang::EldLess: mode = spv::ExecutionMode::DepthLess; break;1790case glslang::EldUnchanged: mode = spv::ExecutionMode::DepthUnchanged; break;1791default: mode = spv::ExecutionMode::Max; break;1792}17931794if (mode != spv::ExecutionMode::Max)1795builder.addExecutionMode(shaderEntry, mode);17961797switch (glslangIntermediate->getStencil()) {1798case glslang::ElsRefUnchangedFrontAMD: mode = spv::ExecutionMode::StencilRefUnchangedFrontAMD; break;1799case glslang::ElsRefGreaterFrontAMD: mode = spv::ExecutionMode::StencilRefGreaterFrontAMD; break;1800case glslang::ElsRefLessFrontAMD: mode = spv::ExecutionMode::StencilRefLessFrontAMD; break;1801case glslang::ElsRefUnchangedBackAMD: mode = spv::ExecutionMode::StencilRefUnchangedBackAMD; break;1802case glslang::ElsRefGreaterBackAMD: mode = spv::ExecutionMode::StencilRefGreaterBackAMD; break;1803case glslang::ElsRefLessBackAMD: mode = spv::ExecutionMode::StencilRefLessBackAMD; break;1804default: mode = spv::ExecutionMode::Max; break;1805}18061807if (mode != spv::ExecutionMode::Max)1808builder.addExecutionMode(shaderEntry, (spv::ExecutionMode)mode);1809switch (glslangIntermediate->getInterlockOrdering()) {1810case glslang::EioPixelInterlockOrdered: mode = spv::ExecutionMode::PixelInterlockOrderedEXT;1811break;1812case glslang::EioPixelInterlockUnordered: mode = spv::ExecutionMode::PixelInterlockUnorderedEXT;1813break;1814case glslang::EioSampleInterlockOrdered: mode = spv::ExecutionMode::SampleInterlockOrderedEXT;1815break;1816case glslang::EioSampleInterlockUnordered: mode = spv::ExecutionMode::SampleInterlockUnorderedEXT;1817break;1818case glslang::EioShadingRateInterlockOrdered: mode = spv::ExecutionMode::ShadingRateInterlockOrderedEXT;1819break;1820case glslang::EioShadingRateInterlockUnordered: mode = 
spv::ExecutionMode::ShadingRateInterlockUnorderedEXT;1821break;1822default: mode = spv::ExecutionMode::Max;1823break;1824}1825if (mode != spv::ExecutionMode::Max) {1826builder.addExecutionMode(shaderEntry, (spv::ExecutionMode)mode);1827if (mode == spv::ExecutionMode::ShadingRateInterlockOrderedEXT ||1828mode == spv::ExecutionMode::ShadingRateInterlockUnorderedEXT) {1829builder.addCapability(spv::Capability::FragmentShaderShadingRateInterlockEXT);1830} else if (mode == spv::ExecutionMode::PixelInterlockOrderedEXT ||1831mode == spv::ExecutionMode::PixelInterlockUnorderedEXT) {1832builder.addCapability(spv::Capability::FragmentShaderPixelInterlockEXT);1833} else {1834builder.addCapability(spv::Capability::FragmentShaderSampleInterlockEXT);1835}1836builder.addExtension(spv::E_SPV_EXT_fragment_shader_interlock);1837}1838break;18391840case EShLangCompute: {1841builder.addCapability(spv::Capability::Shader);1842bool needSizeId = false;1843for (int dim = 0; dim < 3; ++dim) {1844if ((glslangIntermediate->getLocalSizeSpecId(dim) != glslang::TQualifier::layoutNotSet)) {1845needSizeId = true;1846break;1847}1848}1849if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6 && needSizeId) {1850std::vector<spv::Id> dimConstId;1851for (int dim = 0; dim < 3; ++dim) {1852bool specConst = (glslangIntermediate->getLocalSizeSpecId(dim) != glslang::TQualifier::layoutNotSet);1853dimConstId.push_back(builder.makeUintConstant(glslangIntermediate->getLocalSize(dim), specConst));1854if (specConst) {1855builder.addDecoration(dimConstId.back(), spv::Decoration::SpecId,1856glslangIntermediate->getLocalSizeSpecId(dim));1857needSizeId = true;1858}1859}1860builder.addExecutionModeId(shaderEntry, spv::ExecutionMode::LocalSizeId, dimConstId);1861} else {1862if (glslangIntermediate->getTileShadingRateQCOM(0) >= 1 || glslangIntermediate->getTileShadingRateQCOM(1) >= 1 || glslangIntermediate->getTileShadingRateQCOM(2) >= 1) {1863auto rate_x = 
glslangIntermediate->getTileShadingRateQCOM(0);1864auto rate_y = glslangIntermediate->getTileShadingRateQCOM(1);1865auto rate_z = glslangIntermediate->getTileShadingRateQCOM(2);1866rate_x = ( rate_x == 0 ? 1 : rate_x );1867rate_y = ( rate_y == 0 ? 1 : rate_y );1868rate_z = ( rate_z == 0 ? 1 : rate_z );1869builder.addExecutionMode(shaderEntry, spv::ExecutionMode::TileShadingRateQCOM, rate_x, rate_y, rate_z);1870} else {1871builder.addExecutionMode(shaderEntry, spv::ExecutionMode::LocalSize, glslangIntermediate->getLocalSize(0),1872glslangIntermediate->getLocalSize(1),1873glslangIntermediate->getLocalSize(2));1874}1875}1876if (glslangIntermediate->getLayoutDerivativeModeNone() == glslang::LayoutDerivativeGroupQuads) {1877builder.addCapability(spv::Capability::ComputeDerivativeGroupQuadsNV);1878builder.addExecutionMode(shaderEntry, spv::ExecutionMode::DerivativeGroupQuadsNV);1879builder.addExtension(spv::E_SPV_NV_compute_shader_derivatives);1880} else if (glslangIntermediate->getLayoutDerivativeModeNone() == glslang::LayoutDerivativeGroupLinear) {1881builder.addCapability(spv::Capability::ComputeDerivativeGroupLinearNV);1882builder.addExecutionMode(shaderEntry, spv::ExecutionMode::DerivativeGroupLinearNV);1883builder.addExtension(spv::E_SPV_NV_compute_shader_derivatives);1884}18851886if (glslangIntermediate->getNonCoherentTileAttachmentReadQCOM()) {1887builder.addCapability(spv::Capability::TileShadingQCOM);1888builder.addExecutionMode(shaderEntry, spv::ExecutionMode::NonCoherentTileAttachmentReadQCOM);1889builder.addExtension(spv::E_SPV_QCOM_tile_shading);1890}18911892break;1893}1894case EShLangTessEvaluation:1895case EShLangTessControl:1896builder.addCapability(spv::Capability::Tessellation);18971898glslang::TLayoutGeometry primitive;18991900if (glslangIntermediate->getStage() == EShLangTessControl) {1901builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OutputVertices,1902glslangIntermediate->getVertices());1903primitive = 
glslangIntermediate->getOutputPrimitive();1904} else {1905primitive = glslangIntermediate->getInputPrimitive();1906}19071908switch (primitive) {1909case glslang::ElgTriangles: mode = spv::ExecutionMode::Triangles; break;1910case glslang::ElgQuads: mode = spv::ExecutionMode::Quads; break;1911case glslang::ElgIsolines: mode = spv::ExecutionMode::Isolines; break;1912default: mode = spv::ExecutionMode::Max; break;1913}1914if (mode != spv::ExecutionMode::Max)1915builder.addExecutionMode(shaderEntry, mode);19161917switch (glslangIntermediate->getVertexSpacing()) {1918case glslang::EvsEqual: mode = spv::ExecutionMode::SpacingEqual; break;1919case glslang::EvsFractionalEven: mode = spv::ExecutionMode::SpacingFractionalEven; break;1920case glslang::EvsFractionalOdd: mode = spv::ExecutionMode::SpacingFractionalOdd; break;1921default: mode = spv::ExecutionMode::Max; break;1922}1923if (mode != spv::ExecutionMode::Max)1924builder.addExecutionMode(shaderEntry, mode);19251926switch (glslangIntermediate->getVertexOrder()) {1927case glslang::EvoCw: mode = spv::ExecutionMode::VertexOrderCw; break;1928case glslang::EvoCcw: mode = spv::ExecutionMode::VertexOrderCcw; break;1929default: mode = spv::ExecutionMode::Max; break;1930}1931if (mode != spv::ExecutionMode::Max)1932builder.addExecutionMode(shaderEntry, mode);19331934if (glslangIntermediate->getPointMode())1935builder.addExecutionMode(shaderEntry, spv::ExecutionMode::PointMode);1936break;19371938case EShLangGeometry:1939builder.addCapability(spv::Capability::Geometry);1940switch (glslangIntermediate->getInputPrimitive()) {1941case glslang::ElgPoints: mode = spv::ExecutionMode::InputPoints; break;1942case glslang::ElgLines: mode = spv::ExecutionMode::InputLines; break;1943case glslang::ElgLinesAdjacency: mode = spv::ExecutionMode::InputLinesAdjacency; break;1944case glslang::ElgTriangles: mode = spv::ExecutionMode::Triangles; break;1945case glslang::ElgTrianglesAdjacency: mode = spv::ExecutionMode::InputTrianglesAdjacency; 
break;1946default: mode = spv::ExecutionMode::Max; break;1947}1948if (mode != spv::ExecutionMode::Max)1949builder.addExecutionMode(shaderEntry, mode);19501951builder.addExecutionMode(shaderEntry, spv::ExecutionMode::Invocations, glslangIntermediate->getInvocations());19521953switch (glslangIntermediate->getOutputPrimitive()) {1954case glslang::ElgPoints: mode = spv::ExecutionMode::OutputPoints; break;1955case glslang::ElgLineStrip: mode = spv::ExecutionMode::OutputLineStrip; break;1956case glslang::ElgTriangleStrip: mode = spv::ExecutionMode::OutputTriangleStrip; break;1957default: mode = spv::ExecutionMode::Max; break;1958}1959if (mode != spv::ExecutionMode::Max)1960builder.addExecutionMode(shaderEntry, mode);1961builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OutputVertices, glslangIntermediate->getVertices());1962break;19631964case EShLangRayGen:1965case EShLangIntersect:1966case EShLangAnyHit:1967case EShLangClosestHit:1968case EShLangMiss:1969case EShLangCallable:1970{1971auto& extensions = glslangIntermediate->getRequestedExtensions();1972if (extensions.find("GL_EXT_opacity_micromap") != extensions.end()) {1973builder.addCapability(spv::Capability::RayTracingOpacityMicromapEXT);1974builder.addExtension("SPV_EXT_opacity_micromap");1975}1976if (extensions.find("GL_NV_ray_tracing") == extensions.end()) {1977builder.addCapability(spv::Capability::RayTracingKHR);1978builder.addExtension("SPV_KHR_ray_tracing");1979}1980else {1981builder.addCapability(spv::Capability::RayTracingNV);1982builder.addExtension("SPV_NV_ray_tracing");1983}1984if (glslangIntermediate->getStage() != EShLangRayGen && glslangIntermediate->getStage() != EShLangCallable) {1985if (extensions.find("GL_EXT_ray_cull_mask") != extensions.end()) {1986builder.addCapability(spv::Capability::RayCullMaskKHR);1987builder.addExtension("SPV_KHR_ray_cull_mask");1988}1989if (extensions.find("GL_EXT_ray_tracing_position_fetch") != extensions.end()) 
{1990builder.addCapability(spv::Capability::RayTracingPositionFetchKHR);1991builder.addExtension("SPV_KHR_ray_tracing_position_fetch");1992}1993}1994break;1995}1996case EShLangTask:1997case EShLangMesh:1998if(isMeshShaderExt) {1999builder.addCapability(spv::Capability::MeshShadingEXT);2000builder.addExtension(spv::E_SPV_EXT_mesh_shader);2001} else {2002builder.addCapability(spv::Capability::MeshShadingNV);2003builder.addExtension(spv::E_SPV_NV_mesh_shader);2004}2005if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6) {2006std::vector<spv::Id> dimConstId;2007for (int dim = 0; dim < 3; ++dim) {2008bool specConst = (glslangIntermediate->getLocalSizeSpecId(dim) != glslang::TQualifier::layoutNotSet);2009dimConstId.push_back(builder.makeUintConstant(glslangIntermediate->getLocalSize(dim), specConst));2010if (specConst) {2011builder.addDecoration(dimConstId.back(), spv::Decoration::SpecId,2012glslangIntermediate->getLocalSizeSpecId(dim));2013}2014}2015builder.addExecutionModeId(shaderEntry, spv::ExecutionMode::LocalSizeId, dimConstId);2016} else {2017builder.addExecutionMode(shaderEntry, spv::ExecutionMode::LocalSize, glslangIntermediate->getLocalSize(0),2018glslangIntermediate->getLocalSize(1),2019glslangIntermediate->getLocalSize(2));2020}2021if (glslangIntermediate->getStage() == EShLangMesh) {2022builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OutputVertices,2023glslangIntermediate->getVertices());2024builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OutputPrimitivesNV,2025glslangIntermediate->getPrimitives());20262027switch (glslangIntermediate->getOutputPrimitive()) {2028case glslang::ElgPoints: mode = spv::ExecutionMode::OutputPoints; break;2029case glslang::ElgLines: mode = spv::ExecutionMode::OutputLinesNV; break;2030case glslang::ElgTriangles: mode = spv::ExecutionMode::OutputTrianglesNV; break;2031default: mode = spv::ExecutionMode::Max; break;2032}2033if (mode != spv::ExecutionMode::Max)2034builder.addExecutionMode(shaderEntry, 
(spv::ExecutionMode)mode);2035}2036break;20372038default:2039break;2040}20412042//2043// Add SPIR-V requirements (GL_EXT_spirv_intrinsics)2044//2045if (glslangIntermediate->hasSpirvRequirement()) {2046const glslang::TSpirvRequirement& spirvRequirement = glslangIntermediate->getSpirvRequirement();20472048// Add SPIR-V extension requirement2049for (auto& extension : spirvRequirement.extensions)2050builder.addExtension(extension.c_str());20512052// Add SPIR-V capability requirement2053for (auto capability : spirvRequirement.capabilities)2054builder.addCapability(static_cast<spv::Capability>(capability));2055}20562057//2058// Add SPIR-V execution mode qualifiers (GL_EXT_spirv_intrinsics)2059//2060if (glslangIntermediate->hasSpirvExecutionMode()) {2061const glslang::TSpirvExecutionMode spirvExecutionMode = glslangIntermediate->getSpirvExecutionMode();20622063// Add spirv_execution_mode2064for (auto& mode : spirvExecutionMode.modes) {2065if (!mode.second.empty()) {2066std::vector<unsigned> literals;2067TranslateLiterals(mode.second, literals);2068builder.addExecutionMode(shaderEntry, static_cast<spv::ExecutionMode>(mode.first), literals);2069} else2070builder.addExecutionMode(shaderEntry, static_cast<spv::ExecutionMode>(mode.first));2071}20722073// Add spirv_execution_mode_id2074for (auto& modeId : spirvExecutionMode.modeIds) {2075std::vector<spv::Id> operandIds;2076assert(!modeId.second.empty());2077for (auto extraOperand : modeId.second) {2078if (extraOperand->getType().getQualifier().isSpecConstant())2079operandIds.push_back(getSymbolId(extraOperand->getAsSymbolNode()));2080else2081operandIds.push_back(createSpvConstant(*extraOperand));2082}2083builder.addExecutionModeId(shaderEntry, static_cast<spv::ExecutionMode>(modeId.first), operandIds);2084}2085}2086}20872088// Finish creating SPV, after the traversal is complete.2089void TGlslangToSpvTraverser::finishSpv(bool compileOnly)2090{2091// If not linking, an entry point is not expected2092if (!compileOnly) {2093// 
Finish the entry point function2094if (!entryPointTerminated) {2095builder.setBuildPoint(shaderEntry->getLastBlock());2096builder.leaveFunction();2097}20982099// finish off the entry-point SPV instruction by adding the Input/Output <id>2100entryPoint->reserveOperands(iOSet.size());2101for (auto id : iOSet)2102entryPoint->addIdOperand(id);2103}21042105// Add capabilities, extensions, remove unneeded decorations, etc.,2106// based on the resulting SPIR-V.2107// Note: WebGPU code generation must have the opportunity to aggressively2108// prune unreachable merge blocks and continue targets.2109builder.postProcess(compileOnly);2110}21112112// Write the SPV into 'out'.2113void TGlslangToSpvTraverser::dumpSpv(std::vector<unsigned int>& out)2114{2115builder.dump(out);2116}21172118//2119// Implement the traversal functions.2120//2121// Return true from interior nodes to have the external traversal2122// continue on to children. Return false if children were2123// already processed.2124//21252126//2127// Symbols can turn into2128// - uniform/input reads2129// - output writes2130// - complex lvalue base setups: foo.bar[3].... 
, where we see foo and start up an access chain2131// - something simple that degenerates into the last bullet2132//2133void TGlslangToSpvTraverser::visitSymbol(glslang::TIntermSymbol* symbol)2134{2135// We update the line information even though no code might be generated here2136// This is helpful to yield correct lines for control flow instructions2137if (!linkageOnly) {2138builder.setDebugSourceLocation(symbol->getLoc().line, symbol->getLoc().getFilename());2139}21402141if (symbol->getBasicType() == glslang::EbtFunction) {2142return;2143}21442145SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);2146if (symbol->getType().isStruct())2147glslangTypeToIdMap[symbol->getType().getStruct()] = symbol->getId();21482149if (symbol->getType().getQualifier().isSpecConstant())2150spec_constant_op_mode_setter.turnOnSpecConstantOpMode();2151#ifdef ENABLE_HLSL2152// Skip symbol handling if it is string-typed2153if (symbol->getBasicType() == glslang::EbtString)2154return;2155#endif21562157// getSymbolId() will set up all the IO decorations on the first call.2158// Formal function parameters were mapped during makeFunctions().2159spv::Id id = getSymbolId(symbol);21602161if (symbol->getType().getQualifier().isTaskPayload())2162taskPayloadID = id; // cache the taskPayloadID to be used it as operand for OpEmitMeshTasksEXT21632164if (builder.isPointer(id)) {2165if (!symbol->getType().getQualifier().isParamInput() &&2166!symbol->getType().getQualifier().isParamOutput()) {2167// Include all "static use" and "linkage only" interface variables on the OpEntryPoint instruction2168// Consider adding to the OpEntryPoint interface list.2169// Only looking at structures if they have at least one member.2170if (!symbol->getType().isStruct() || symbol->getType().getStruct()->size() > 0) {2171spv::StorageClass sc = builder.getStorageClass(id);2172// Before SPIR-V 1.4, we only want to include Input and Output.2173// Starting with SPIR-V 1.4, we want all globals.2174if 
((glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4 && builder.isGlobalVariable(id)) ||2175(sc == spv::StorageClass::Input || sc == spv::StorageClass::Output)) {2176iOSet.insert(id);2177}2178}2179}21802181// If the SPIR-V type is required to be different than the AST type2182// (for ex SubgroupMasks or 3x4 ObjectToWorld/WorldToObject matrices),2183// translate now from the SPIR-V type to the AST type, for the consuming2184// operation.2185// Note this turns it from an l-value to an r-value.2186// Currently, all symbols needing this are inputs; avoid the map lookup when non-input.2187if (symbol->getType().getQualifier().storage == glslang::EvqVaryingIn)2188id = translateForcedType(id);2189}21902191// Only process non-linkage-only nodes for generating actual static uses2192if (! linkageOnly || symbol->getQualifier().isSpecConstant()) {2193// Prepare to generate code for the access21942195// L-value chains will be computed left to right. We're on the symbol now,2196// which is the left-most part of the access chain, so now is "clear" time,2197// followed by setting the base.2198builder.clearAccessChain();21992200// For now, we consider all user variables as being in memory, so they are pointers,2201// except for2202// A) R-Value arguments to a function, which are an intermediate object.2203// See comments in handleUserFunctionCall().2204// B) Specialization constants (normal constants don't even come in as a variable),2205// These are also pure R-values.2206// C) R-Values from type translation, see above call to translateForcedType()2207glslang::TQualifier qualifier = symbol->getQualifier();2208if (qualifier.isSpecConstant() || rValueParameters.find(symbol->getId()) != rValueParameters.end() ||2209!builder.isPointerType(builder.getTypeId(id)))2210builder.setAccessChainRValue(id);2211else2212builder.setAccessChainLValue(id);2213}22142215#ifdef ENABLE_HLSL2216// Process linkage-only nodes for any special additional interface work.2217if (linkageOnly) 
{2218if (glslangIntermediate->getHlslFunctionality1()) {2219// Map implicit counter buffers to their originating buffers, which should have been2220// seen by now, given earlier pruning of unused counters, and preservation of order2221// of declaration.2222if (symbol->getType().getQualifier().isUniformOrBuffer()) {2223if (!glslangIntermediate->hasCounterBufferName(symbol->getName())) {2224// Save possible originating buffers for counter buffers, keyed by2225// making the potential counter-buffer name.2226std::string keyName = symbol->getName().c_str();2227keyName = glslangIntermediate->addCounterBufferName(keyName);2228counterOriginator[keyName] = symbol;2229} else {2230// Handle a counter buffer, by finding the saved originating buffer.2231std::string keyName = symbol->getName().c_str();2232auto it = counterOriginator.find(keyName);2233if (it != counterOriginator.end()) {2234id = getSymbolId(it->second);2235if (id != spv::NoResult) {2236spv::Id counterId = getSymbolId(symbol);2237if (counterId != spv::NoResult) {2238builder.addExtension("SPV_GOOGLE_hlsl_functionality1");2239builder.addDecorationId(id, spv::Decoration::HlslCounterBufferGOOGLE, counterId);2240}2241}2242}2243}2244}2245}2246}2247#endif2248}22492250bool TGlslangToSpvTraverser::visitBinary(glslang::TVisit /* visit */, glslang::TIntermBinary* node)2251{2252builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());2253if (node->getLeft()->getAsSymbolNode() != nullptr && node->getLeft()->getType().isStruct()) {2254glslangTypeToIdMap[node->getLeft()->getType().getStruct()] = node->getLeft()->getAsSymbolNode()->getId();2255}2256if (node->getRight()->getAsSymbolNode() != nullptr && node->getRight()->getType().isStruct()) {2257glslangTypeToIdMap[node->getRight()->getType().getStruct()] = node->getRight()->getAsSymbolNode()->getId();2258}22592260SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);2261if 
(node->getType().getQualifier().isSpecConstant())2262spec_constant_op_mode_setter.turnOnSpecConstantOpMode();22632264// First, handle special cases2265switch (node->getOp()) {2266case glslang::EOpAssign:2267case glslang::EOpAddAssign:2268case glslang::EOpSubAssign:2269case glslang::EOpMulAssign:2270case glslang::EOpVectorTimesMatrixAssign:2271case glslang::EOpVectorTimesScalarAssign:2272case glslang::EOpMatrixTimesScalarAssign:2273case glslang::EOpMatrixTimesMatrixAssign:2274case glslang::EOpDivAssign:2275case glslang::EOpModAssign:2276case glslang::EOpAndAssign:2277case glslang::EOpInclusiveOrAssign:2278case glslang::EOpExclusiveOrAssign:2279case glslang::EOpLeftShiftAssign:2280case glslang::EOpRightShiftAssign:2281// A bin-op assign "a += b" means the same thing as "a = a + b"2282// where a is evaluated before b. For a simple assignment, GLSL2283// says to evaluate the left before the right. So, always, left2284// node then right node.2285{2286// get the left l-value, save it away2287builder.clearAccessChain();2288node->getLeft()->traverse(this);2289spv::Builder::AccessChain lValue = builder.getAccessChain();22902291// evaluate the right2292builder.clearAccessChain();2293node->getRight()->traverse(this);2294spv::Id rValue = accessChainLoad(node->getRight()->getType());22952296// reset line number for assignment2297builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());22982299if (node->getOp() != glslang::EOpAssign) {2300// the left is also an r-value2301builder.setAccessChain(lValue);2302spv::Id leftRValue = accessChainLoad(node->getLeft()->getType());23032304// do the operation2305spv::Builder::AccessChain::CoherentFlags coherentFlags = TranslateCoherent(node->getLeft()->getType());2306coherentFlags |= TranslateCoherent(node->getRight()->getType());2307OpDecorations decorations = { 
TranslatePrecisionDecoration(node->getOperationPrecision()),2308TranslateNoContractionDecoration(node->getType().getQualifier()),2309TranslateNonUniformDecoration(coherentFlags) };2310rValue = createBinaryOperation(node->getOp(), decorations,2311convertGlslangToSpvType(node->getType()), leftRValue, rValue,2312node->getType().getBasicType());23132314// these all need their counterparts in createBinaryOperation()2315assert(rValue != spv::NoResult);2316}23172318// store the result2319builder.setAccessChain(lValue);2320multiTypeStore(node->getLeft()->getType(), rValue);23212322// assignments are expressions having an rValue after they are evaluated...2323builder.clearAccessChain();2324builder.setAccessChainRValue(rValue);2325}2326return false;2327case glslang::EOpIndexDirect:2328case glslang::EOpIndexDirectStruct:2329{2330// Structure, array, matrix, or vector indirection with statically known index.2331// Get the left part of the access chain.2332node->getLeft()->traverse(this);23332334// Add the next element in the chain23352336const int glslangIndex = node->getRight()->getAsConstantUnion()->getConstArray()[0].getIConst();2337if (! 
node->getLeft()->getType().isArray() &&2338node->getLeft()->getType().isVector() &&2339node->getOp() == glslang::EOpIndexDirect) {2340// Swizzle is uniform so propagate uniform into access chain2341spv::Builder::AccessChain::CoherentFlags coherentFlags = TranslateCoherent(node->getLeft()->getType());2342coherentFlags.nonUniform = 0;2343// This is essentially a hard-coded vector swizzle of size 1,2344// so short circuit the access-chain stuff with a swizzle.2345std::vector<unsigned> swizzle;2346swizzle.push_back(glslangIndex);2347int dummySize;2348builder.accessChainPushSwizzle(swizzle, convertGlslangToSpvType(node->getLeft()->getType()),2349coherentFlags,2350glslangIntermediate->getBaseAlignmentScalar(2351node->getLeft()->getType(), dummySize));2352} else {23532354// Load through a block reference is performed with a dot operator that2355// is mapped to EOpIndexDirectStruct. When we get to the actual reference,2356// do a load and reset the access chain.2357if (node->getLeft()->isReference() &&2358!node->getLeft()->getType().isArray() &&2359node->getOp() == glslang::EOpIndexDirectStruct)2360{2361spv::Id left = accessChainLoad(node->getLeft()->getType());2362builder.clearAccessChain();2363builder.setAccessChainLValue(left);2364}23652366int spvIndex = glslangIndex;2367if (node->getLeft()->getBasicType() == glslang::EbtBlock &&2368node->getOp() == glslang::EOpIndexDirectStruct)2369{2370// This may be, e.g., an anonymous block-member selection, which generally need2371// index remapping due to hidden members in anonymous blocks.2372long long glslangId = glslangTypeToIdMap[node->getLeft()->getType().getStruct()];2373if (memberRemapper.find(glslangId) != memberRemapper.end()) {2374std::vector<int>& remapper = memberRemapper[glslangId];2375assert(remapper.size() > 0);2376spvIndex = remapper[glslangIndex];2377}2378}23792380// Struct reference propagates uniform lvalue2381spv::Builder::AccessChain::CoherentFlags coherentFlags 
=2382TranslateCoherent(node->getLeft()->getType());2383coherentFlags.nonUniform = 0;23842385// normal case for indexing array or structure or block2386if ((node->getRight()->getType().getBasicType() == glslang::EbtUint && glslangIntermediate->usingPromoteUint32Indices()) ||2387node->getRight()->getType().contains64BitInt()) {2388int64_t idx = node->getRight()->getType().contains64BitInt() ?2389node->getRight()->getAsConstantUnion()->getConstArray()[0].getI64Const() :2390node->getRight()->getAsConstantUnion()->getConstArray()[0].getUConst();2391builder.accessChainPush(builder.makeInt64Constant(idx),2392coherentFlags,2393node->getLeft()->getType().getBufferReferenceAlignment());23942395} else {2396builder.accessChainPush(builder.makeIntConstant(spvIndex),2397coherentFlags,2398node->getLeft()->getType().getBufferReferenceAlignment());2399}2400// Add capabilities here for accessing PointSize and clip/cull distance.2401// We have deferred generation of associated capabilities until now.2402if (node->getLeft()->getType().isStruct() && ! 
node->getLeft()->getType().isArray())2403declareUseOfStructMember(*(node->getLeft()->getType().getStruct()), glslangIndex);2404}2405}2406return false;2407case glslang::EOpIndexIndirect:2408{2409// Array, matrix, or vector indirection with variable index.2410// Will use native SPIR-V access-chain for and array indirection;2411// matrices are arrays of vectors, so will also work for a matrix.2412// Will use the access chain's 'component' for variable index into a vector.24132414// This adapter is building access chains left to right.2415// Set up the access chain to the left.2416node->getLeft()->traverse(this);24172418// save it so that computing the right side doesn't trash it2419spv::Builder::AccessChain partial = builder.getAccessChain();24202421// compute the next index in the chain2422builder.clearAccessChain();2423node->getRight()->traverse(this);2424spv::Id index = accessChainLoad(node->getRight()->getType());24252426// Zero-extend smaller unsigned integer types for array indexing.2427// SPIR-V OpAccessChain treats indices as signed, so we need to zero-extend2428// unsigned types to preserve their values (signed types are fine as-is).2429spv::Id indexType = builder.getTypeId(index);2430if (builder.isUintType(indexType) && builder.getScalarTypeWidth(indexType) < 32) {2431// Zero-extend unsigned types to preserve their values2432spv::Id uintType = builder.makeUintType(32);2433index = builder.createUnaryOp(spv::Op::OpUConvert, uintType, index);2434}24352436addIndirectionIndexCapabilities(node->getLeft()->getType(), node->getRight()->getType());24372438// restore the saved access chain2439builder.setAccessChain(partial);24402441// Only if index is nonUniform should we propagate nonUniform into access chain2442spv::Builder::AccessChain::CoherentFlags index_flags = TranslateCoherent(node->getRight()->getType());2443spv::Builder::AccessChain::CoherentFlags coherent_flags = TranslateCoherent(node->getLeft()->getType());2444coherent_flags.nonUniform = 
index_flags.nonUniform;24452446if (! node->getLeft()->getType().isArray() && node->getLeft()->getType().isVector()) {2447int dummySize;2448builder.accessChainPushComponent(2449index, convertGlslangToSpvType(node->getLeft()->getType()), coherent_flags,2450glslangIntermediate->getBaseAlignmentScalar(node->getLeft()->getType(),2451dummySize));2452} else {2453if (glslangIntermediate->usingPromoteUint32Indices() &&2454node->getRight()->getType().getBasicType() == glslang::EbtUint) {2455index = createIntWidthConversion(index, 0, builder.makeIntegerType(64, true), glslang::EbtInt64, node->getRight()->getType().getBasicType());2456}24572458builder.accessChainPush(index, coherent_flags,2459node->getLeft()->getType().getBufferReferenceAlignment());2460}2461}2462return false;2463case glslang::EOpVectorSwizzle:2464{2465node->getLeft()->traverse(this);2466std::vector<unsigned> swizzle;2467convertSwizzle(*node->getRight()->getAsAggregate(), swizzle);2468int dummySize;2469builder.accessChainPushSwizzle(swizzle, convertGlslangToSpvType(node->getLeft()->getType()),2470TranslateCoherent(node->getLeft()->getType()),2471glslangIntermediate->getBaseAlignmentScalar(node->getLeft()->getType(),2472dummySize));2473}2474return false;2475case glslang::EOpMatrixSwizzle:2476logger->missingFunctionality("matrix swizzle");2477return true;2478case glslang::EOpLogicalOr:2479case glslang::EOpLogicalAnd:2480{24812482// These may require short circuiting, but can sometimes be done as straight2483// binary operations. 
The right operand must be short circuited if it has2484// side effects, and should probably be if it is complex.2485if (isTrivial(node->getRight()->getAsTyped()))2486break; // handle below as a normal binary operation2487// otherwise, we need to do dynamic short circuiting on the right operand2488spv::Id result = createShortCircuit(node->getOp(), *node->getLeft()->getAsTyped(),2489*node->getRight()->getAsTyped());2490builder.clearAccessChain();2491builder.setAccessChainRValue(result);2492}2493return false;2494default:2495break;2496}24972498// Assume generic binary op...24992500// get right operand2501builder.clearAccessChain();2502node->getLeft()->traverse(this);2503spv::Id left = accessChainLoad(node->getLeft()->getType());25042505// get left operand2506builder.clearAccessChain();2507node->getRight()->traverse(this);2508spv::Id right = accessChainLoad(node->getRight()->getType());25092510// get result2511OpDecorations decorations = { TranslatePrecisionDecoration(node->getOperationPrecision()),2512TranslateNoContractionDecoration(node->getType().getQualifier()),2513TranslateNonUniformDecoration(node->getType().getQualifier()) };2514spv::Id result = createBinaryOperation(node->getOp(), decorations,2515convertGlslangToSpvType(node->getType()), left, right,2516node->getLeft()->getType().getBasicType());25172518builder.clearAccessChain();2519if (! 
result) {2520logger->missingFunctionality("unknown glslang binary operation");2521return true; // pick up a child as the place-holder result2522} else {2523builder.setAccessChainRValue(result);2524return false;2525}2526}25272528spv::Id TGlslangToSpvTraverser::convertLoadedBoolInUniformToUint(const glslang::TType& type,2529spv::Id nominalTypeId,2530spv::Id loadedId)2531{2532if (builder.isScalarType(nominalTypeId)) {2533// Conversion for bool2534spv::Id boolType = builder.makeBoolType();2535if (nominalTypeId != boolType)2536return builder.createBinOp(spv::Op::OpINotEqual, boolType, loadedId, builder.makeUintConstant(0));2537} else if (builder.isVectorType(nominalTypeId)) {2538// Conversion for bvec2539int vecSize = builder.getNumTypeComponents(nominalTypeId);2540spv::Id bvecType = builder.makeVectorType(builder.makeBoolType(), vecSize);2541if (nominalTypeId != bvecType)2542loadedId = builder.createBinOp(spv::Op::OpINotEqual, bvecType, loadedId,2543makeSmearedConstant(builder.makeUintConstant(0), vecSize));2544} else if (builder.isArrayType(nominalTypeId)) {2545// Conversion for bool array2546spv::Id boolArrayTypeId = convertGlslangToSpvType(type);2547if (nominalTypeId != boolArrayTypeId)2548{2549// Use OpCopyLogical from SPIR-V 1.4 if available.2550if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4)2551return builder.createUnaryOp(spv::Op::OpCopyLogical, boolArrayTypeId, loadedId);25522553glslang::TType glslangElementType(type, 0);2554spv::Id elementNominalTypeId = builder.getContainedTypeId(nominalTypeId);2555std::vector<spv::Id> constituents;2556for (int index = 0; index < type.getOuterArraySize(); ++index) {2557// get the element2558spv::Id elementValue = builder.createCompositeExtract(loadedId, elementNominalTypeId, index);25592560// recursively convert it2561spv::Id elementConvertedValue = convertLoadedBoolInUniformToUint(glslangElementType, elementNominalTypeId, elementValue);2562constituents.push_back(elementConvertedValue);2563}2564return 
builder.createCompositeConstruct(boolArrayTypeId, constituents);2565}2566}25672568return loadedId;2569}25702571// Figure out what, if any, type changes are needed when accessing a specific built-in.2572// Returns <the type SPIR-V requires for declarion, the type to translate to on use>.2573// Also see comment for 'forceType', regarding tracking SPIR-V-required types.2574std::pair<spv::Id, spv::Id> TGlslangToSpvTraverser::getForcedType(glslang::TBuiltInVariable glslangBuiltIn,2575const glslang::TType& glslangType)2576{2577switch(glslangBuiltIn)2578{2579case glslang::EbvSubGroupEqMask:2580case glslang::EbvSubGroupGeMask:2581case glslang::EbvSubGroupGtMask:2582case glslang::EbvSubGroupLeMask:2583case glslang::EbvSubGroupLtMask: {2584// these require changing a 64-bit scaler -> a vector of 32-bit components2585if (glslangType.isVector())2586break;2587spv::Id ivec4_type = builder.makeVectorType(builder.makeUintType(32), 4);2588spv::Id uint64_type = builder.makeUintType(64);2589std::pair<spv::Id, spv::Id> ret(ivec4_type, uint64_type);2590return ret;2591}2592// There are no SPIR-V builtins defined for these and map onto original non-transposed2593// builtins. 
During visitBinary we insert a transpose2594case glslang::EbvWorldToObject3x4:2595case glslang::EbvObjectToWorld3x4: {2596spv::Id mat43 = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);2597spv::Id mat34 = builder.makeMatrixType(builder.makeFloatType(32), 3, 4);2598std::pair<spv::Id, spv::Id> ret(mat43, mat34);2599return ret;2600}2601default:2602break;2603}26042605std::pair<spv::Id, spv::Id> ret(spv::NoType, spv::NoType);2606return ret;2607}26082609// For an object previously identified (see getForcedType() and forceType)2610// as needing type translations, do the translation needed for a load, turning2611// an L-value into in R-value.2612spv::Id TGlslangToSpvTraverser::translateForcedType(spv::Id object)2613{2614const auto forceIt = forceType.find(object);2615if (forceIt == forceType.end())2616return object;26172618spv::Id desiredTypeId = forceIt->second;2619spv::Id objectTypeId = builder.getTypeId(object);2620assert(builder.isPointerType(objectTypeId));2621objectTypeId = builder.getContainedTypeId(objectTypeId);2622if (builder.isVectorType(objectTypeId) &&2623builder.getScalarTypeWidth(builder.getContainedTypeId(objectTypeId)) == 32) {2624if (builder.getScalarTypeWidth(desiredTypeId) == 64) {2625// handle 32-bit v.xy* -> 64-bit2626builder.clearAccessChain();2627builder.setAccessChainLValue(object);2628object = builder.accessChainLoad(spv::NoPrecision, spv::Decoration::Max, spv::Decoration::Max, objectTypeId);2629std::vector<spv::Id> components;2630components.push_back(builder.createCompositeExtract(object, builder.getContainedTypeId(objectTypeId), 0));2631components.push_back(builder.createCompositeExtract(object, builder.getContainedTypeId(objectTypeId), 1));26322633spv::Id vecType = builder.makeVectorType(builder.getContainedTypeId(objectTypeId), 2);2634return builder.createUnaryOp(spv::Op::OpBitcast, desiredTypeId,2635builder.createCompositeConstruct(vecType, components));2636} else {2637logger->missingFunctionality("forcing 32-bit vector type to non 
64-bit scalar");2638}2639} else if (builder.isMatrixType(objectTypeId)) {2640// There are no SPIR-V builtins defined for 3x4 variants of ObjectToWorld/WorldToObject2641// and we insert a transpose after loading the original non-transposed builtins2642builder.clearAccessChain();2643builder.setAccessChainLValue(object);2644object = builder.accessChainLoad(spv::NoPrecision, spv::Decoration::Max, spv::Decoration::Max, objectTypeId);2645return builder.createUnaryOp(spv::Op::OpTranspose, desiredTypeId, object);26462647} else {2648logger->missingFunctionality("forcing non 32-bit vector type");2649}26502651return object;2652}26532654bool TGlslangToSpvTraverser::visitUnary(glslang::TVisit /* visit */, glslang::TIntermUnary* node)2655{2656builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());26572658SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);2659if (node->getType().getQualifier().isSpecConstant())2660spec_constant_op_mode_setter.turnOnSpecConstantOpMode();26612662spv::Id result = spv::NoResult;26632664// try texturing first2665result = createImageTextureFunctionCall(node);2666if (result != spv::NoResult) {2667builder.clearAccessChain();2668builder.setAccessChainRValue(result);26692670return false; // done with this node2671}26722673// Non-texturing.26742675if (node->getOp() == glslang::EOpArrayLength) {2676// Quite special; won't want to evaluate the operand.26772678// Currently, the front-end does not allow .length() on an array until it is sized,2679// except for the last block membeor of an SSBO.2680// TODO: If this changes, link-time sized arrays might show up here, and need their2681// size extracted.26822683// Normal .length() would have been constant folded by the front-end.2684// So, this has to be block.lastMember.length().2685// SPV wants "block" and member number as the operands, go get them.26862687uint32_t bits = node->getType().contains64BitInt() ? 
64 : 32;26882689spv::Id length;2690if (node->getOperand()->getType().isCoopMat()) {2691spv::Id typeId = convertGlslangToSpvType(node->getOperand()->getType());2692assert(builder.isCooperativeMatrixType(typeId));26932694if (node->getOperand()->getType().isCoopMatKHR()) {2695length = builder.createCooperativeMatrixLengthKHR(typeId);2696} else {2697spec_constant_op_mode_setter.turnOnSpecConstantOpMode();2698length = builder.createCooperativeMatrixLengthNV(typeId);2699}2700} else if (node->getOperand()->getType().isCoopVecNV()) {2701spv::Id typeId = convertGlslangToSpvType(node->getOperand()->getType());2702length = builder.getCooperativeVectorNumComponents(typeId);2703} else {2704glslang::TIntermTyped* block = node->getOperand()->getAsBinaryNode()->getLeft();2705block->traverse(this);2706unsigned int member = node->getOperand()->getAsBinaryNode()->getRight()->getAsConstantUnion()2707->getConstArray()[0].getUConst();2708length = builder.createArrayLength(builder.accessChainGetLValue(), member, bits);2709}27102711// GLSL semantics say the result of .length() is an int, while SPIR-V says2712// signedness must be 0. So, convert from SPIR-V unsigned back to GLSL's2713// AST expectation of a signed result.2714if (glslangIntermediate->getSource() == glslang::EShSourceGlsl) {2715if (builder.isInSpecConstCodeGenMode()) {2716length = builder.createBinOp(spv::Op::OpIAdd, builder.makeIntType(bits), length, builder.makeIntConstant(0));2717} else {2718length = builder.createUnaryOp(spv::Op::OpBitcast, builder.makeIntType(bits), length);2719}2720}27212722builder.clearAccessChain();2723builder.setAccessChainRValue(length);27242725return false;2726}27272728// Force variable declaration - Debug Mode Only2729if (node->getOp() == glslang::EOpDeclare) {2730builder.clearAccessChain();2731node->getOperand()->traverse(this);2732builder.clearAccessChain();2733return false;2734}27352736// Start by evaluating the operand27372738// Does it need a swizzle inversion? 
If so, evaluation is inverted;2739// operate first on the swizzle base, then apply the swizzle.2740spv::Id invertedType = spv::NoType;2741auto resultType = [&invertedType, &node, this](){ return invertedType != spv::NoType ?2742invertedType : convertGlslangToSpvType(node->getType()); };2743if (node->getOp() == glslang::EOpInterpolateAtCentroid)2744invertedType = getInvertedSwizzleType(*node->getOperand());27452746builder.clearAccessChain();2747TIntermNode *operandNode;2748if (invertedType != spv::NoType)2749operandNode = node->getOperand()->getAsBinaryNode()->getLeft();2750else2751operandNode = node->getOperand();27522753operandNode->traverse(this);27542755spv::Id operand = spv::NoResult;27562757spv::Builder::AccessChain::CoherentFlags lvalueCoherentFlags;27582759const auto hitObjectOpsWithLvalue = [](glslang::TOperator op) {2760switch(op) {2761case glslang::EOpReorderThreadNV:2762case glslang::EOpHitObjectGetCurrentTimeNV:2763case glslang::EOpHitObjectGetHitKindNV:2764case glslang::EOpHitObjectGetPrimitiveIndexNV:2765case glslang::EOpHitObjectGetGeometryIndexNV:2766case glslang::EOpHitObjectGetInstanceIdNV:2767case glslang::EOpHitObjectGetInstanceCustomIndexNV:2768case glslang::EOpHitObjectGetObjectRayDirectionNV:2769case glslang::EOpHitObjectGetObjectRayOriginNV:2770case glslang::EOpHitObjectGetWorldRayDirectionNV:2771case glslang::EOpHitObjectGetWorldRayOriginNV:2772case glslang::EOpHitObjectGetWorldToObjectNV:2773case glslang::EOpHitObjectGetObjectToWorldNV:2774case glslang::EOpHitObjectGetRayTMaxNV:2775case glslang::EOpHitObjectGetRayTMinNV:2776case glslang::EOpHitObjectIsEmptyNV:2777case glslang::EOpHitObjectIsHitNV:2778case glslang::EOpHitObjectIsMissNV:2779case glslang::EOpHitObjectRecordEmptyNV:2780case glslang::EOpHitObjectGetShaderBindingTableRecordIndexNV:2781case glslang::EOpHitObjectGetShaderRecordBufferHandleNV:2782case glslang::EOpHitObjectGetClusterIdNV:2783case glslang::EOpHitObjectGetSpherePositionNV:2784case 
glslang::EOpHitObjectGetSphereRadiusNV:2785case glslang::EOpHitObjectIsSphereHitNV:2786case glslang::EOpHitObjectIsLSSHitNV:2787case glslang::EOpReorderThreadEXT:2788case glslang::EOpHitObjectGetCurrentTimeEXT:2789case glslang::EOpHitObjectGetHitKindEXT:2790case glslang::EOpHitObjectGetPrimitiveIndexEXT:2791case glslang::EOpHitObjectGetGeometryIndexEXT:2792case glslang::EOpHitObjectGetInstanceIdEXT:2793case glslang::EOpHitObjectGetInstanceCustomIndexEXT:2794case glslang::EOpHitObjectGetObjectRayDirectionEXT:2795case glslang::EOpHitObjectGetObjectRayOriginEXT:2796case glslang::EOpHitObjectGetWorldRayDirectionEXT:2797case glslang::EOpHitObjectGetWorldRayOriginEXT:2798case glslang::EOpHitObjectGetWorldToObjectEXT:2799case glslang::EOpHitObjectGetObjectToWorldEXT:2800case glslang::EOpHitObjectGetRayTMaxEXT:2801case glslang::EOpHitObjectGetRayTMinEXT:2802case glslang::EOpHitObjectGetRayFlagsEXT:2803case glslang::EOpHitObjectIsEmptyEXT:2804case glslang::EOpHitObjectIsHitEXT:2805case glslang::EOpHitObjectIsMissEXT:2806case glslang::EOpHitObjectRecordEmptyEXT:2807case glslang::EOpHitObjectGetShaderBindingTableRecordIndexEXT:2808case glslang::EOpHitObjectGetShaderRecordBufferHandleEXT:2809return true;2810default:2811return false;2812}2813};28142815if (node->getOp() == glslang::EOpAtomicCounterIncrement ||2816node->getOp() == glslang::EOpAtomicCounterDecrement ||2817node->getOp() == glslang::EOpAtomicCounter ||2818(node->getOp() == glslang::EOpInterpolateAtCentroid &&2819glslangIntermediate->getSource() != glslang::EShSourceHlsl) ||2820node->getOp() == glslang::EOpRayQueryProceed ||2821node->getOp() == glslang::EOpRayQueryGetRayTMin ||2822node->getOp() == glslang::EOpRayQueryGetRayFlags ||2823node->getOp() == glslang::EOpRayQueryGetWorldRayOrigin ||2824node->getOp() == glslang::EOpRayQueryGetWorldRayDirection ||2825node->getOp() == glslang::EOpRayQueryGetIntersectionCandidateAABBOpaque ||2826node->getOp() == glslang::EOpRayQueryTerminate ||2827node->getOp() == 
glslang::EOpRayQueryConfirmIntersection ||2828(node->getOp() == glslang::EOpSpirvInst && operandNode->getAsTyped()->getQualifier().isSpirvByReference()) ||2829hitObjectOpsWithLvalue(node->getOp())) {2830operand = builder.accessChainGetLValue(); // Special case l-value operands2831lvalueCoherentFlags = builder.getAccessChain().coherentFlags;2832lvalueCoherentFlags |= TranslateCoherent(operandNode->getAsTyped()->getType());2833} else if (operandNode->getAsTyped()->getQualifier().isSpirvLiteral()) {2834// Will be translated to a literal value, make a placeholder here2835operand = spv::NoResult;2836} else {2837operand = accessChainLoad(node->getOperand()->getType());2838}28392840OpDecorations decorations = { TranslatePrecisionDecoration(node->getOperationPrecision()),2841TranslateNoContractionDecoration(node->getType().getQualifier()),2842TranslateNonUniformDecoration(node->getType().getQualifier()) };28432844// it could be a conversion2845if (! result) {2846result = createConversion(node->getOp(), decorations, resultType(), operand,2847node->getType().getBasicType(), node->getOperand()->getBasicType());2848if (result) {2849if (node->getType().isCoopMatKHR() && node->getOperand()->getAsTyped()->getType().isCoopMatKHR() &&2850!node->getAsTyped()->getType().sameCoopMatUse(node->getOperand()->getAsTyped()->getType())) {2851// Conversions that change use need CapabilityCooperativeMatrixConversionsNV2852builder.addCapability(spv::Capability::CooperativeMatrixConversionsNV);2853builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);2854}2855}2856}28572858// if not, then possibly an operation2859if (! 
result)2860result = createUnaryOperation(node->getOp(), decorations, resultType(), operand,2861node->getOperand()->getBasicType(), lvalueCoherentFlags, node->getType());28622863// it could be attached to a SPIR-V intruction2864if (!result) {2865if (node->getOp() == glslang::EOpSpirvInst) {2866const auto& spirvInst = node->getSpirvInstruction();2867if (spirvInst.set == "") {2868spv::IdImmediate idImmOp = {true, operand};2869if (operandNode->getAsTyped()->getQualifier().isSpirvLiteral()) {2870// Translate the constant to a literal value2871std::vector<unsigned> literals;2872glslang::TVector<const glslang::TIntermConstantUnion*> constants;2873constants.push_back(operandNode->getAsConstantUnion());2874TranslateLiterals(constants, literals);2875idImmOp = {false, literals[0]};2876}28772878if (node->getBasicType() == glslang::EbtVoid)2879builder.createNoResultOp(static_cast<spv::Op>(spirvInst.id), {idImmOp});2880else2881result = builder.createOp(static_cast<spv::Op>(spirvInst.id), resultType(), {idImmOp});2882} else {2883result = builder.createBuiltinCall(2884resultType(), spirvInst.set == "GLSL.std.450" ? 
stdBuiltins : getExtBuiltins(spirvInst.set.c_str()),2885spirvInst.id, {operand});2886}28872888if (node->getBasicType() == glslang::EbtVoid)2889return false; // done with this node2890}2891}28922893if (result) {2894if (invertedType) {2895result = createInvertedSwizzle(decorations.precision, *node->getOperand(), result);2896decorations.addNonUniform(builder, result);2897}28982899builder.clearAccessChain();2900builder.setAccessChainRValue(result);29012902return false; // done with this node2903}29042905// it must be a special case, check...2906switch (node->getOp()) {2907case glslang::EOpPostIncrement:2908case glslang::EOpPostDecrement:2909case glslang::EOpPreIncrement:2910case glslang::EOpPreDecrement:2911{2912// we need the integer value "1" or the floating point "1.0" to add/subtract2913spv::Id one = 0;2914if (node->getBasicType() == glslang::EbtFloat)2915one = builder.makeFloatConstant(1.0F);2916else if (node->getBasicType() == glslang::EbtDouble)2917one = builder.makeDoubleConstant(1.0);2918else if (node->getBasicType() == glslang::EbtFloat16)2919one = builder.makeFloat16Constant(1.0F);2920else if (node->getBasicType() == glslang::EbtBFloat16)2921one = builder.makeBFloat16Constant(1.0F);2922else if (node->getBasicType() == glslang::EbtFloatE5M2)2923one = builder.makeFloatE5M2Constant(1.0F);2924else if (node->getBasicType() == glslang::EbtFloatE4M3)2925one = builder.makeFloatE4M3Constant(1.0F);2926else if (node->getBasicType() == glslang::EbtInt8 || node->getBasicType() == glslang::EbtUint8)2927one = builder.makeInt8Constant(1);2928else if (node->getBasicType() == glslang::EbtInt16 || node->getBasicType() == glslang::EbtUint16)2929one = builder.makeInt16Constant(1);2930else if (node->getBasicType() == glslang::EbtInt64 || node->getBasicType() == glslang::EbtUint64)2931one = builder.makeInt64Constant(1);2932else2933one = builder.makeIntConstant(1);2934glslang::TOperator op;2935if (node->getOp() == glslang::EOpPreIncrement ||2936node->getOp() == 
glslang::EOpPostIncrement)2937op = glslang::EOpAdd;2938else2939op = glslang::EOpSub;29402941spv::Id result = createBinaryOperation(op, decorations,2942convertGlslangToSpvType(node->getType()), operand, one,2943node->getType().getBasicType());2944assert(result != spv::NoResult);29452946// The result of operation is always stored, but conditionally the2947// consumed result. The consumed result is always an r-value.2948builder.accessChainStore(result,2949TranslateNonUniformDecoration(builder.getAccessChain().coherentFlags));2950builder.clearAccessChain();2951if (node->getOp() == glslang::EOpPreIncrement ||2952node->getOp() == glslang::EOpPreDecrement)2953builder.setAccessChainRValue(result);2954else2955builder.setAccessChainRValue(operand);2956}29572958return false;29592960case glslang::EOpAssumeEXT:2961builder.addCapability(spv::Capability::ExpectAssumeKHR);2962builder.addExtension(spv::E_SPV_KHR_expect_assume);2963builder.createNoResultOp(spv::Op::OpAssumeTrueKHR, operand);2964return false;2965case glslang::EOpEmitStreamVertex:2966builder.createNoResultOp(spv::Op::OpEmitStreamVertex, operand);2967return false;2968case glslang::EOpEndStreamPrimitive:2969builder.createNoResultOp(spv::Op::OpEndStreamPrimitive, operand);2970return false;2971case glslang::EOpRayQueryTerminate:2972builder.createNoResultOp(spv::Op::OpRayQueryTerminateKHR, operand);2973return false;2974case glslang::EOpRayQueryConfirmIntersection:2975builder.createNoResultOp(spv::Op::OpRayQueryConfirmIntersectionKHR, operand);2976return false;2977case glslang::EOpReorderThreadNV:2978builder.createNoResultOp(spv::Op::OpReorderThreadWithHitObjectNV, operand);2979return false;2980case glslang::EOpReorderThreadEXT:2981builder.createNoResultOp(spv::Op::OpReorderThreadWithHitObjectEXT, operand);2982return false;2983case glslang::EOpHitObjectRecordEmptyNV:2984builder.createNoResultOp(spv::Op::OpHitObjectRecordEmptyNV, operand);2985return false;2986case 
glslang::EOpHitObjectRecordEmptyEXT:2987builder.createNoResultOp(spv::Op::OpHitObjectRecordEmptyEXT, operand);2988return false;29892990case glslang::EOpCreateTensorLayoutNV:2991result = builder.createOp(spv::Op::OpCreateTensorLayoutNV, resultType(), std::vector<spv::Id>{});2992builder.clearAccessChain();2993builder.setAccessChainRValue(result);2994return false;29952996case glslang::EOpCreateTensorViewNV:2997result = builder.createOp(spv::Op::OpCreateTensorViewNV, resultType(), std::vector<spv::Id>{});2998builder.clearAccessChain();2999builder.setAccessChainRValue(result);3000return false;30013002default:3003logger->missingFunctionality("unknown glslang unary");3004return true; // pick up operand as placeholder result3005}3006}30073008// Construct a composite object, recursively copying members if their types don't match3009spv::Id TGlslangToSpvTraverser::createCompositeConstruct(spv::Id resultTypeId, std::vector<spv::Id> constituents)3010{3011for (int c = 0; c < (int)constituents.size(); ++c) {3012spv::Id& constituent = constituents[c];3013spv::Id lType = builder.getContainedTypeId(resultTypeId, c);3014spv::Id rType = builder.getTypeId(constituent);3015if (lType != rType) {3016if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4) {3017constituent = builder.createUnaryOp(spv::Op::OpCopyLogical, lType, constituent);3018} else if (builder.isStructType(rType)) {3019std::vector<spv::Id> rTypeConstituents;3020int numrTypeConstituents = builder.getNumTypeConstituents(rType);3021for (int i = 0; i < numrTypeConstituents; ++i) {3022rTypeConstituents.push_back(builder.createCompositeExtract(constituent,3023builder.getContainedTypeId(rType, i), i));3024}3025constituents[c] = createCompositeConstruct(lType, rTypeConstituents);3026} else {3027assert(builder.isArrayType(rType));3028std::vector<spv::Id> rTypeConstituents;3029int numrTypeConstituents = builder.getNumTypeConstituents(rType);30303031spv::Id elementRType = builder.getContainedTypeId(rType);3032for (int i 
= 0; i < numrTypeConstituents; ++i) {3033rTypeConstituents.push_back(builder.createCompositeExtract(constituent, elementRType, i));3034}3035constituents[c] = createCompositeConstruct(lType, rTypeConstituents);3036}3037}3038}3039return builder.createCompositeConstruct(resultTypeId, constituents);3040}30413042bool TGlslangToSpvTraverser::visitAggregate(glslang::TVisit visit, glslang::TIntermAggregate* node)3043{3044SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);3045if (node->getType().getQualifier().isSpecConstant())3046spec_constant_op_mode_setter.turnOnSpecConstantOpMode();30473048spv::Id result = spv::NoResult;3049spv::Id invertedType = spv::NoType; // to use to override the natural type of the node3050std::vector<spv::Builder::AccessChain> complexLvalues; // for holding swizzling l-values too complex for3051// SPIR-V, for an out parameter3052std::vector<spv::Id> temporaryLvalues; // temporaries to pass, as proxies for complexLValues30533054auto resultType = [&invertedType, &node, this](){3055if (invertedType != spv::NoType) {3056return invertedType;3057} else {3058auto ret = convertGlslangToSpvType(node->getType());3059// convertGlslangToSpvType may clobber the debug location, reset it3060builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());3061return ret;3062}3063};30643065// try texturing3066result = createImageTextureFunctionCall(node);3067if (result != spv::NoResult) {3068builder.clearAccessChain();3069builder.setAccessChainRValue(result);30703071return false;3072} else if (node->getOp() == glslang::EOpImageStore ||3073node->getOp() == glslang::EOpImageStoreLod ||3074node->getOp() == glslang::EOpImageAtomicStore) {3075// "imageStore" is a special case, which has no result3076return false;3077}30783079glslang::TOperator binOp = glslang::EOpNull;3080bool reduceComparison = true;3081bool isMatrix = false;3082bool noReturnValue = false;3083bool atomic = false;30843085spv::Builder::AccessChain::CoherentFlags 
lvalueCoherentFlags;30863087assert(node->getOp());30883089spv::Decoration precision = TranslatePrecisionDecoration(node->getOperationPrecision());30903091switch (node->getOp()) {3092case glslang::EOpScope:3093case glslang::EOpSequence:3094{3095if (visit == glslang::EvPreVisit) {3096++sequenceDepth;3097if (sequenceDepth == 1) {3098// If this is the parent node of all the functions, we want to see them3099// early, so all call points have actual SPIR-V functions to reference.3100// In all cases, still let the traverser visit the children for us.3101makeFunctions(node->getAsAggregate()->getSequence());31023103// Global initializers is specific to the shader entry point, which does not exist in compile-only mode3104if (!options.compileOnly) {3105// Also, we want all globals initializers to go into the beginning of the entry point, before3106// anything else gets there, so visit out of order, doing them all now.3107makeGlobalInitializers(node->getAsAggregate()->getSequence());3108}31093110//Pre process linker objects for ray tracing stages3111if (glslangIntermediate->isRayTracingStage())3112collectRayTracingLinkerObjects();31133114// Initializers are done, don't want to visit again, but functions and link objects need to be processed,3115// so do them manually.3116visitFunctions(node->getAsAggregate()->getSequence());31173118return false;3119} else {3120if (node->getOp() == glslang::EOpScope) {3121auto loc = node->getLoc();3122builder.enterLexicalBlock(loc.line, loc.column);3123}3124}3125} else {3126if (sequenceDepth > 1 && node->getOp() == glslang::EOpScope)3127builder.leaveLexicalBlock();3128--sequenceDepth;3129}31303131return true;3132}3133case glslang::EOpLinkerObjects:3134{3135if (visit == glslang::EvPreVisit)3136linkageOnly = true;3137else3138linkageOnly = false;31393140return true;3141}3142case glslang::EOpComma:3143{3144// processing from left to right naturally leaves the right-most3145// lying around in the access chain3146glslang::TIntermSequence& 
glslangOperands = node->getSequence();3147for (int i = 0; i < (int)glslangOperands.size(); ++i)3148glslangOperands[i]->traverse(this);31493150return false;3151}3152case glslang::EOpFunction:3153if (visit == glslang::EvPreVisit) {3154if (options.generateDebugInfo) {3155builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());3156}3157if (isShaderEntryPoint(node)) {3158inEntryPoint = true;3159builder.setBuildPoint(shaderEntry->getLastBlock());3160builder.enterFunction(shaderEntry);3161currentFunction = shaderEntry;3162} else {3163// SPIR-V functions should already be in the functionMap from the prepass3164// that called makeFunctions().3165currentFunction = functionMap[node->getName().c_str()];3166spv::Block* functionBlock = currentFunction->getEntryBlock();3167builder.setBuildPoint(functionBlock);3168builder.enterFunction(currentFunction);3169}3170if (options.generateDebugInfo && !options.emitNonSemanticShaderDebugInfo) {3171const auto& loc = node->getLoc();3172const char* sourceFileName = loc.getFilename();3173spv::Id sourceFileId = sourceFileName ? builder.getStringId(sourceFileName) : builder.getMainFileId();3174currentFunction->setDebugLineInfo(sourceFileId, loc.line, loc.column);3175}3176} else {3177// Here we have finished visiting the function (post-visit). 
Finalize it.3178if (options.generateDebugInfo) {3179if (glslangIntermediate->getSource() == glslang::EShSourceGlsl && node->getSequence().size() > 1) {3180auto endLoc = node->getSequence()[1]->getAsAggregate()->getEndLoc();3181builder.setDebugSourceLocation(endLoc.line, endLoc.getFilename());3182}3183}3184if (inEntryPoint)3185entryPointTerminated = true;3186builder.leaveFunction();3187inEntryPoint = false;3188currentFunction = nullptr;3189}31903191return true;3192case glslang::EOpParameters:3193// Parameters will have been consumed by EOpFunction processing, but not3194// the body, so we still visited the function node's children, making this3195// child redundant.3196return false;3197case glslang::EOpFunctionCall:3198{3199builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());3200if (node->isUserDefined())3201result = handleUserFunctionCall(node);3202if (result) {3203builder.clearAccessChain();3204builder.setAccessChainRValue(result);3205} else3206logger->missingFunctionality("missing user function; linker needs to catch that");32073208return false;3209}3210case glslang::EOpConstructMat2x2:3211case glslang::EOpConstructMat2x3:3212case glslang::EOpConstructMat2x4:3213case glslang::EOpConstructMat3x2:3214case glslang::EOpConstructMat3x3:3215case glslang::EOpConstructMat3x4:3216case glslang::EOpConstructMat4x2:3217case glslang::EOpConstructMat4x3:3218case glslang::EOpConstructMat4x4:3219case glslang::EOpConstructDMat2x2:3220case glslang::EOpConstructDMat2x3:3221case glslang::EOpConstructDMat2x4:3222case glslang::EOpConstructDMat3x2:3223case glslang::EOpConstructDMat3x3:3224case glslang::EOpConstructDMat3x4:3225case glslang::EOpConstructDMat4x2:3226case glslang::EOpConstructDMat4x3:3227case glslang::EOpConstructDMat4x4:3228case glslang::EOpConstructIMat2x2:3229case glslang::EOpConstructIMat2x3:3230case glslang::EOpConstructIMat2x4:3231case glslang::EOpConstructIMat3x2:3232case glslang::EOpConstructIMat3x3:3233case 
glslang::EOpConstructIMat3x4:3234case glslang::EOpConstructIMat4x2:3235case glslang::EOpConstructIMat4x3:3236case glslang::EOpConstructIMat4x4:3237case glslang::EOpConstructUMat2x2:3238case glslang::EOpConstructUMat2x3:3239case glslang::EOpConstructUMat2x4:3240case glslang::EOpConstructUMat3x2:3241case glslang::EOpConstructUMat3x3:3242case glslang::EOpConstructUMat3x4:3243case glslang::EOpConstructUMat4x2:3244case glslang::EOpConstructUMat4x3:3245case glslang::EOpConstructUMat4x4:3246case glslang::EOpConstructBMat2x2:3247case glslang::EOpConstructBMat2x3:3248case glslang::EOpConstructBMat2x4:3249case glslang::EOpConstructBMat3x2:3250case glslang::EOpConstructBMat3x3:3251case glslang::EOpConstructBMat3x4:3252case glslang::EOpConstructBMat4x2:3253case glslang::EOpConstructBMat4x3:3254case glslang::EOpConstructBMat4x4:3255case glslang::EOpConstructF16Mat2x2:3256case glslang::EOpConstructF16Mat2x3:3257case glslang::EOpConstructF16Mat2x4:3258case glslang::EOpConstructF16Mat3x2:3259case glslang::EOpConstructF16Mat3x3:3260case glslang::EOpConstructF16Mat3x4:3261case glslang::EOpConstructF16Mat4x2:3262case glslang::EOpConstructF16Mat4x3:3263case glslang::EOpConstructF16Mat4x4:3264isMatrix = true;3265[[fallthrough]];3266case glslang::EOpConstructFloat:3267case glslang::EOpConstructVec2:3268case glslang::EOpConstructVec3:3269case glslang::EOpConstructVec4:3270case glslang::EOpConstructDouble:3271case glslang::EOpConstructDVec2:3272case glslang::EOpConstructDVec3:3273case glslang::EOpConstructDVec4:3274case glslang::EOpConstructFloat16:3275case glslang::EOpConstructF16Vec2:3276case glslang::EOpConstructF16Vec3:3277case glslang::EOpConstructF16Vec4:3278case glslang::EOpConstructBFloat16:3279case glslang::EOpConstructBF16Vec2:3280case glslang::EOpConstructBF16Vec3:3281case glslang::EOpConstructBF16Vec4:3282case glslang::EOpConstructFloatE5M2:3283case glslang::EOpConstructFloatE5M2Vec2:3284case glslang::EOpConstructFloatE5M2Vec3:3285case 
glslang::EOpConstructFloatE5M2Vec4:3286case glslang::EOpConstructFloatE4M3:3287case glslang::EOpConstructFloatE4M3Vec2:3288case glslang::EOpConstructFloatE4M3Vec3:3289case glslang::EOpConstructFloatE4M3Vec4:3290case glslang::EOpConstructBool:3291case glslang::EOpConstructBVec2:3292case glslang::EOpConstructBVec3:3293case glslang::EOpConstructBVec4:3294case glslang::EOpConstructInt8:3295case glslang::EOpConstructI8Vec2:3296case glslang::EOpConstructI8Vec3:3297case glslang::EOpConstructI8Vec4:3298case glslang::EOpConstructUint8:3299case glslang::EOpConstructU8Vec2:3300case glslang::EOpConstructU8Vec3:3301case glslang::EOpConstructU8Vec4:3302case glslang::EOpConstructInt16:3303case glslang::EOpConstructI16Vec2:3304case glslang::EOpConstructI16Vec3:3305case glslang::EOpConstructI16Vec4:3306case glslang::EOpConstructUint16:3307case glslang::EOpConstructU16Vec2:3308case glslang::EOpConstructU16Vec3:3309case glslang::EOpConstructU16Vec4:3310case glslang::EOpConstructInt:3311case glslang::EOpConstructIVec2:3312case glslang::EOpConstructIVec3:3313case glslang::EOpConstructIVec4:3314case glslang::EOpConstructUint:3315case glslang::EOpConstructUVec2:3316case glslang::EOpConstructUVec3:3317case glslang::EOpConstructUVec4:3318case glslang::EOpConstructInt64:3319case glslang::EOpConstructI64Vec2:3320case glslang::EOpConstructI64Vec3:3321case glslang::EOpConstructI64Vec4:3322case glslang::EOpConstructUint64:3323case glslang::EOpConstructU64Vec2:3324case glslang::EOpConstructU64Vec3:3325case glslang::EOpConstructU64Vec4:3326case glslang::EOpConstructStruct:3327case glslang::EOpConstructTextureSampler:3328case glslang::EOpConstructReference:3329case glslang::EOpConstructCooperativeMatrixNV:3330case glslang::EOpConstructCooperativeMatrixKHR:3331case glslang::EOpConstructCooperativeVectorNV:3332case glslang::EOpConstructSaturated:3333{3334builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());3335std::vector<spv::Id> arguments;3336translateArguments(*node, 
arguments, lvalueCoherentFlags);3337spv::Id constructed;3338if (node->getOp() == glslang::EOpConstructTextureSampler) {3339const glslang::TType& texType = node->getSequence()[0]->getAsTyped()->getType();3340if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6 &&3341texType.getSampler().isBuffer()) {3342// SamplerBuffer is not supported in spirv1.6 so3343// `samplerBuffer(textureBuffer, sampler)` is a no-op3344// and textureBuffer is the result going forward3345constructed = arguments[0];3346} else3347constructed = builder.createOp(spv::Op::OpSampledImage, resultType(), arguments);3348} else if (node->getOp() == glslang::EOpConstructCooperativeMatrixKHR &&3349node->getType().isCoopMatKHR() && node->getSequence()[0]->getAsTyped()->getType().isCoopMatKHR()) {3350builder.addCapability(spv::Capability::CooperativeMatrixConversionsNV);3351builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);3352constructed = builder.createCooperativeMatrixConversion(resultType(), arguments[0]);3353} else if (node->getOp() == glslang::EOpConstructCooperativeVectorNV &&3354arguments.size() == 1 &&3355builder.getTypeId(arguments[0]) == resultType()) {3356constructed = arguments[0];3357} else if (node->getOp() == glslang::EOpConstructStruct ||3358node->getOp() == glslang::EOpConstructCooperativeMatrixNV ||3359node->getOp() == glslang::EOpConstructCooperativeMatrixKHR ||3360node->getType().isArray() ||3361// Handle constructing coopvec from one component here, to avoid the component3362// getting smeared3363(node->getOp() == glslang::EOpConstructCooperativeVectorNV && arguments.size() == 1 && builder.isScalar(arguments[0]))) {3364std::vector<spv::Id> constituents;3365for (int c = 0; c < (int)arguments.size(); ++c)3366constituents.push_back(arguments[c]);3367constructed = createCompositeConstruct(resultType(), constituents);3368} else if (isMatrix)3369constructed = builder.createMatrixConstructor(precision, arguments, resultType());3370else if (node->getOp() == 
glslang::EOpConstructSaturated) {3371OpDecorations decorations = { TranslatePrecisionDecoration(node->getOperationPrecision()),3372TranslateNoContractionDecoration(node->getType().getQualifier()),3373TranslateNonUniformDecoration(lvalueCoherentFlags) };33743375constructed = createConversion(node->getOp(), decorations, resultType(), arguments[1],3376node->getType().getBasicType(), node->getSequence()[1]->getAsTyped()->getBasicType());3377builder.addDecoration(constructed, spv::Decoration::SaturatedToLargestFloat8NormalConversionEXT);3378builder.createStore(constructed, arguments[0]);3379}3380else3381constructed = builder.createConstructor(precision, arguments, resultType());33823383if (node->getType().getQualifier().isNonUniform()) {3384builder.addDecoration(constructed, spv::Decoration::NonUniformEXT);3385}33863387builder.clearAccessChain();3388builder.setAccessChainRValue(constructed);33893390return false;3391}33923393// These six are component-wise compares with component-wise results.3394// Forward on to createBinaryOperation(), requesting a vector result.3395case glslang::EOpLessThan:3396case glslang::EOpGreaterThan:3397case glslang::EOpLessThanEqual:3398case glslang::EOpGreaterThanEqual:3399case glslang::EOpVectorEqual:3400case glslang::EOpVectorNotEqual:3401{3402// Map the operation to a binary3403binOp = node->getOp();3404reduceComparison = false;3405switch (node->getOp()) {3406case glslang::EOpVectorEqual: binOp = glslang::EOpVectorEqual; break;3407case glslang::EOpVectorNotEqual: binOp = glslang::EOpVectorNotEqual; break;3408default: binOp = node->getOp(); break;3409}34103411break;3412}3413case glslang::EOpMul:3414// component-wise matrix multiply3415binOp = glslang::EOpMul;3416break;3417case glslang::EOpOuterProduct:3418// two vectors multiplied to make a matrix3419binOp = glslang::EOpOuterProduct;3420break;3421case glslang::EOpDot:3422{3423// for scalar dot product, use multiply3424glslang::TIntermSequence& glslangOperands = node->getSequence();3425if 
(glslangOperands[0]->getAsTyped()->getVectorSize() == 1)3426binOp = glslang::EOpMul;3427break;3428}3429case glslang::EOpMod:3430// when an aggregate, this is the floating-point mod built-in function,3431// which can be emitted by the one in createBinaryOperation()3432binOp = glslang::EOpMod;3433break;34343435case glslang::EOpEmitVertex:3436case glslang::EOpEndPrimitive:3437case glslang::EOpBarrier:3438case glslang::EOpMemoryBarrier:3439case glslang::EOpMemoryBarrierAtomicCounter:3440case glslang::EOpMemoryBarrierBuffer:3441case glslang::EOpMemoryBarrierImage:3442case glslang::EOpMemoryBarrierShared:3443case glslang::EOpGroupMemoryBarrier:3444case glslang::EOpDeviceMemoryBarrier:3445case glslang::EOpAllMemoryBarrierWithGroupSync:3446case glslang::EOpDeviceMemoryBarrierWithGroupSync:3447case glslang::EOpWorkgroupMemoryBarrier:3448case glslang::EOpWorkgroupMemoryBarrierWithGroupSync:3449case glslang::EOpSubgroupBarrier:3450case glslang::EOpSubgroupMemoryBarrier:3451case glslang::EOpSubgroupMemoryBarrierBuffer:3452case glslang::EOpSubgroupMemoryBarrierImage:3453case glslang::EOpSubgroupMemoryBarrierShared:3454noReturnValue = true;3455// These all have 0 operands and will naturally finish up in the code below for 0 operands3456break;34573458case glslang::EOpAtomicAdd:3459case glslang::EOpAtomicSubtract:3460case glslang::EOpAtomicMin:3461case glslang::EOpAtomicMax:3462case glslang::EOpAtomicAnd:3463case glslang::EOpAtomicOr:3464case glslang::EOpAtomicXor:3465case glslang::EOpAtomicExchange:3466case glslang::EOpAtomicCompSwap:3467atomic = true;3468break;34693470case glslang::EOpAtomicStore:3471noReturnValue = true;3472[[fallthrough]];3473case glslang::EOpAtomicLoad:3474atomic = true;3475break;34763477case glslang::EOpAtomicCounterAdd:3478case glslang::EOpAtomicCounterSubtract:3479case glslang::EOpAtomicCounterMin:3480case glslang::EOpAtomicCounterMax:3481case glslang::EOpAtomicCounterAnd:3482case glslang::EOpAtomicCounterOr:3483case glslang::EOpAtomicCounterXor:3484case 
glslang::EOpAtomicCounterExchange:3485case glslang::EOpAtomicCounterCompSwap:3486builder.addExtension("SPV_KHR_shader_atomic_counter_ops");3487builder.addCapability(spv::Capability::AtomicStorageOps);3488atomic = true;3489break;34903491case glslang::EOpAbsDifference:3492case glslang::EOpAddSaturate:3493case glslang::EOpSubSaturate:3494case glslang::EOpAverage:3495case glslang::EOpAverageRounded:3496case glslang::EOpMul32x16:3497builder.addCapability(spv::Capability::IntegerFunctions2INTEL);3498builder.addExtension("SPV_INTEL_shader_integer_functions2");3499binOp = node->getOp();3500break;35013502case glslang::EOpExpectEXT:3503builder.addCapability(spv::Capability::ExpectAssumeKHR);3504builder.addExtension(spv::E_SPV_KHR_expect_assume);3505binOp = node->getOp();3506break;35073508case glslang::EOpIgnoreIntersectionNV:3509case glslang::EOpTerminateRayNV:3510case glslang::EOpTraceNV:3511case glslang::EOpTraceRayMotionNV:3512case glslang::EOpTraceKHR:3513case glslang::EOpExecuteCallableNV:3514case glslang::EOpExecuteCallableKHR:3515case glslang::EOpWritePackedPrimitiveIndices4x8NV:3516case glslang::EOpEmitMeshTasksEXT:3517case glslang::EOpSetMeshOutputsEXT:3518noReturnValue = true;3519break;3520case glslang::EOpRayQueryInitialize:3521case glslang::EOpRayQueryTerminate:3522case glslang::EOpRayQueryGenerateIntersection:3523case glslang::EOpRayQueryConfirmIntersection:3524builder.addExtension("SPV_KHR_ray_query");3525builder.addCapability(spv::Capability::RayQueryKHR);3526noReturnValue = true;3527break;3528case glslang::EOpRayQueryProceed:3529case glslang::EOpRayQueryGetIntersectionType:3530case glslang::EOpRayQueryGetRayTMin:3531case glslang::EOpRayQueryGetRayFlags:3532case glslang::EOpRayQueryGetIntersectionT:3533case glslang::EOpRayQueryGetIntersectionInstanceCustomIndex:3534case glslang::EOpRayQueryGetIntersectionInstanceId:3535case glslang::EOpRayQueryGetIntersectionInstanceShaderBindingTableRecordOffset:3536case 
glslang::EOpRayQueryGetIntersectionGeometryIndex:3537case glslang::EOpRayQueryGetIntersectionPrimitiveIndex:3538case glslang::EOpRayQueryGetIntersectionBarycentrics:3539case glslang::EOpRayQueryGetIntersectionFrontFace:3540case glslang::EOpRayQueryGetIntersectionCandidateAABBOpaque:3541case glslang::EOpRayQueryGetIntersectionObjectRayDirection:3542case glslang::EOpRayQueryGetIntersectionObjectRayOrigin:3543case glslang::EOpRayQueryGetWorldRayDirection:3544case glslang::EOpRayQueryGetWorldRayOrigin:3545case glslang::EOpRayQueryGetIntersectionObjectToWorld:3546case glslang::EOpRayQueryGetIntersectionWorldToObject:3547builder.addExtension("SPV_KHR_ray_query");3548builder.addCapability(spv::Capability::RayQueryKHR);3549break;3550case glslang::EOpCooperativeMatrixLoad:3551case glslang::EOpCooperativeMatrixStore:3552case glslang::EOpCooperativeMatrixLoadNV:3553case glslang::EOpCooperativeMatrixStoreNV:3554case glslang::EOpCooperativeMatrixLoadTensorNV:3555case glslang::EOpCooperativeMatrixStoreTensorNV:3556case glslang::EOpCooperativeMatrixReduceNV:3557case glslang::EOpCooperativeMatrixPerElementOpNV:3558case glslang::EOpCooperativeMatrixTransposeNV:3559case glslang::EOpCooperativeVectorMatMulNV:3560case glslang::EOpCooperativeVectorMatMulAddNV:3561case glslang::EOpCooperativeVectorLoadNV:3562case glslang::EOpCooperativeVectorStoreNV:3563case glslang::EOpCooperativeVectorOuterProductAccumulateNV:3564case glslang::EOpCooperativeVectorReduceSumAccumulateNV:3565noReturnValue = true;3566break;3567case glslang::EOpBeginInvocationInterlock:3568case glslang::EOpEndInvocationInterlock:3569builder.addExtension(spv::E_SPV_EXT_fragment_shader_interlock);3570noReturnValue = true;3571break;35723573case glslang::EOpHitObjectTraceRayNV:3574case glslang::EOpHitObjectTraceRayMotionNV:3575case glslang::EOpHitObjectGetAttributesNV:3576case glslang::EOpHitObjectExecuteShaderNV:3577case glslang::EOpHitObjectRecordEmptyNV:3578case glslang::EOpHitObjectRecordMissNV:3579case 
glslang::EOpHitObjectRecordMissMotionNV:3580case glslang::EOpHitObjectRecordHitNV:3581case glslang::EOpHitObjectRecordHitMotionNV:3582case glslang::EOpHitObjectRecordHitWithIndexNV:3583case glslang::EOpHitObjectRecordHitWithIndexMotionNV:3584case glslang::EOpReorderThreadNV:3585noReturnValue = true;3586[[fallthrough]];3587case glslang::EOpHitObjectIsEmptyNV:3588case glslang::EOpHitObjectIsMissNV:3589case glslang::EOpHitObjectIsHitNV:3590case glslang::EOpHitObjectGetRayTMinNV:3591case glslang::EOpHitObjectGetRayTMaxNV:3592case glslang::EOpHitObjectGetObjectRayOriginNV:3593case glslang::EOpHitObjectGetObjectRayDirectionNV:3594case glslang::EOpHitObjectGetWorldRayOriginNV:3595case glslang::EOpHitObjectGetWorldRayDirectionNV:3596case glslang::EOpHitObjectGetObjectToWorldNV:3597case glslang::EOpHitObjectGetWorldToObjectNV:3598case glslang::EOpHitObjectGetInstanceCustomIndexNV:3599case glslang::EOpHitObjectGetInstanceIdNV:3600case glslang::EOpHitObjectGetGeometryIndexNV:3601case glslang::EOpHitObjectGetPrimitiveIndexNV:3602case glslang::EOpHitObjectGetHitKindNV:3603case glslang::EOpHitObjectGetCurrentTimeNV:3604case glslang::EOpHitObjectGetShaderBindingTableRecordIndexNV:3605case glslang::EOpHitObjectGetShaderRecordBufferHandleNV:3606builder.addExtension(spv::E_SPV_NV_shader_invocation_reorder);3607builder.addCapability(spv::Capability::ShaderInvocationReorderNV);3608break;36093610case glslang::EOpHitObjectGetLSSPositionsNV:3611case glslang::EOpHitObjectGetLSSRadiiNV:3612builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);3613builder.addCapability(spv::Capability::ShaderInvocationReorderNV);3614builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);3615noReturnValue = true;3616break;36173618case glslang::EOpRayQueryGetIntersectionLSSPositionsNV:3619case 
glslang::EOpRayQueryGetIntersectionLSSRadiiNV:3620builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);3621builder.addCapability(spv::Capability::RayQueryKHR);3622builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);3623noReturnValue = true;3624break;36253626case glslang::EOpRayQueryGetIntersectionSpherePositionNV:3627case glslang::EOpRayQueryGetIntersectionSphereRadiusNV:3628case glslang::EOpRayQueryIsSphereHitNV:3629builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);3630builder.addCapability(spv::Capability::RayQueryKHR);3631builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);3632builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);3633break;36343635case glslang::EOpRayQueryGetIntersectionLSSHitValueNV:3636case glslang::EOpRayQueryIsLSSHitNV:3637builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);3638builder.addCapability(spv::Capability::RayQueryKHR);3639builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);3640break;36413642case glslang::EOpHitObjectTraceRayEXT:3643case glslang::EOpHitObjectTraceRayMotionEXT:3644case glslang::EOpHitObjectGetAttributesEXT:3645case glslang::EOpHitObjectExecuteShaderEXT:3646case glslang::EOpHitObjectRecordEmptyEXT:3647case glslang::EOpHitObjectRecordMissEXT:3648case glslang::EOpHitObjectRecordMissMotionEXT:3649case glslang::EOpReorderThreadEXT:3650case glslang::EOpHitObjectSetShaderBindingTableRecordIndexEXT:3651case glslang::EOpHitObjectReorderExecuteEXT:3652case glslang::EOpHitObjectTraceReorderExecuteEXT:3653case glslang::EOpHitObjectTraceMotionReorderExecuteEXT:3654case glslang::EOpHitObjectRecordFromQueryEXT:3655case glslang::EOpHitObjectGetIntersectionTriangleVertexPositionsEXT:3656noReturnValue = true;3657[[fallthrough]];3658case glslang::EOpHitObjectIsEmptyEXT:3659case glslang::EOpHitObjectIsMissEXT:3660case glslang::EOpHitObjectIsHitEXT:3661case glslang::EOpHitObjectGetRayTMinEXT:3662case 
glslang::EOpHitObjectGetRayTMaxEXT:3663case glslang::EOpHitObjectGetRayFlagsEXT:3664case glslang::EOpHitObjectGetObjectRayOriginEXT:3665case glslang::EOpHitObjectGetObjectRayDirectionEXT:3666case glslang::EOpHitObjectGetWorldRayOriginEXT:3667case glslang::EOpHitObjectGetWorldRayDirectionEXT:3668case glslang::EOpHitObjectGetObjectToWorldEXT:3669case glslang::EOpHitObjectGetWorldToObjectEXT:3670case glslang::EOpHitObjectGetInstanceCustomIndexEXT:3671case glslang::EOpHitObjectGetInstanceIdEXT:3672case glslang::EOpHitObjectGetGeometryIndexEXT:3673case glslang::EOpHitObjectGetPrimitiveIndexEXT:3674case glslang::EOpHitObjectGetHitKindEXT:3675case glslang::EOpHitObjectGetCurrentTimeEXT:3676case glslang::EOpHitObjectGetShaderBindingTableRecordIndexEXT:3677case glslang::EOpHitObjectGetShaderRecordBufferHandleEXT:3678builder.addExtension(spv::E_SPV_EXT_shader_invocation_reorder);3679builder.addCapability(spv::Capability::ShaderInvocationReorderEXT);3680break;36813682case glslang::EOpRayQueryGetIntersectionTriangleVertexPositionsEXT:3683builder.addExtension(spv::E_SPV_KHR_ray_tracing_position_fetch);3684builder.addCapability(spv::Capability::RayQueryPositionFetchKHR);3685noReturnValue = true;3686break;3687case glslang::EOpImageSampleWeightedQCOM:3688builder.addCapability(spv::Capability::TextureSampleWeightedQCOM);3689builder.addExtension(spv::E_SPV_QCOM_image_processing);3690break;3691case glslang::EOpImageBoxFilterQCOM:3692builder.addCapability(spv::Capability::TextureBoxFilterQCOM);3693builder.addExtension(spv::E_SPV_QCOM_image_processing);3694break;3695case glslang::EOpImageBlockMatchSADQCOM:3696case glslang::EOpImageBlockMatchSSDQCOM:3697builder.addCapability(spv::Capability::TextureBlockMatchQCOM);3698builder.addExtension(spv::E_SPV_QCOM_image_processing);3699break;3700case glslang::EOpTensorWriteARM:3701noReturnValue = true;3702break;37033704case glslang::EOpImageBlockMatchWindowSSDQCOM:3705case 
glslang::EOpImageBlockMatchWindowSADQCOM:3706builder.addCapability(spv::Capability::TextureBlockMatchQCOM);3707builder.addExtension(spv::E_SPV_QCOM_image_processing);3708builder.addCapability(spv::Capability::TextureBlockMatch2QCOM);3709builder.addExtension(spv::E_SPV_QCOM_image_processing2);3710break;37113712case glslang::EOpImageBlockMatchGatherSSDQCOM:3713case glslang::EOpImageBlockMatchGatherSADQCOM:3714builder.addCapability(spv::Capability::TextureBlockMatchQCOM);3715builder.addExtension(spv::E_SPV_QCOM_image_processing);3716builder.addCapability(spv::Capability::TextureBlockMatch2QCOM);3717builder.addExtension(spv::E_SPV_QCOM_image_processing2);3718break;37193720case glslang::EOpFetchMicroTriangleVertexPositionNV:3721case glslang::EOpFetchMicroTriangleVertexBarycentricNV:3722builder.addExtension(spv::E_SPV_NV_displacement_micromap);3723builder.addCapability(spv::Capability::DisplacementMicromapNV);3724break;37253726case glslang::EOpRayQueryGetIntersectionClusterIdNV:3727builder.addExtension(spv::E_SPV_NV_cluster_acceleration_structure);3728builder.addCapability(spv::Capability::RayQueryKHR);3729builder.addCapability(spv::Capability::RayTracingClusterAccelerationStructureNV);3730break;37313732case glslang::EOpDebugPrintf:3733noReturnValue = true;3734break;37353736default:3737break;3738}37393740//3741// See if it maps to a regular operation.3742//3743if (binOp != glslang::EOpNull) {3744glslang::TIntermTyped* left = node->getSequence()[0]->getAsTyped();3745glslang::TIntermTyped* right = node->getSequence()[1]->getAsTyped();3746assert(left && right);37473748builder.clearAccessChain();3749left->traverse(this);3750spv::Id leftId = accessChainLoad(left->getType());37513752builder.clearAccessChain();3753right->traverse(this);3754spv::Id rightId = accessChainLoad(right->getType());37553756builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());3757OpDecorations decorations = { 
precision,3758TranslateNoContractionDecoration(node->getType().getQualifier()),3759TranslateNonUniformDecoration(node->getType().getQualifier()) };3760result = createBinaryOperation(binOp, decorations,3761resultType(), leftId, rightId,3762left->getType().getBasicType(), reduceComparison);37633764// code above should only make binOp that exists in createBinaryOperation3765assert(result != spv::NoResult);3766builder.clearAccessChain();3767builder.setAccessChainRValue(result);37683769return false;3770}37713772//3773// Create the list of operands.3774//3775glslang::TIntermSequence& glslangOperands = node->getSequence();3776std::vector<spv::Id> operands;3777std::vector<spv::IdImmediate> memoryAccessOperands;3778for (int arg = 0; arg < (int)glslangOperands.size(); ++arg) {3779// special case l-value operands; there are just a few3780bool lvalue = false;3781switch (node->getOp()) {3782case glslang::EOpModf:3783if (arg == 1)3784lvalue = true;3785break;3786378737883789case glslang::EOpHitObjectRecordFromQueryEXT:3790case glslang::EOpHitObjectGetIntersectionTriangleVertexPositionsEXT:3791if (arg == 0 || arg == 1)3792lvalue = true;3793break;37943795case glslang::EOpHitObjectRecordHitNV:3796case glslang::EOpHitObjectRecordHitMotionNV:3797case glslang::EOpHitObjectRecordHitWithIndexNV:3798case glslang::EOpHitObjectRecordHitWithIndexMotionNV:3799case glslang::EOpHitObjectTraceRayNV:3800case glslang::EOpHitObjectTraceRayMotionNV:3801case glslang::EOpHitObjectExecuteShaderNV:3802case glslang::EOpHitObjectRecordMissNV:3803case glslang::EOpHitObjectRecordMissMotionNV:3804case glslang::EOpHitObjectGetAttributesNV:3805case glslang::EOpHitObjectGetClusterIdNV:3806case glslang::EOpHitObjectTraceRayEXT:3807case glslang::EOpHitObjectTraceRayMotionEXT:3808case glslang::EOpHitObjectExecuteShaderEXT:3809case glslang::EOpHitObjectRecordMissEXT:3810case glslang::EOpHitObjectRecordMissMotionEXT:3811case glslang::EOpHitObjectGetAttributesEXT:3812case 
glslang::EOpHitObjectSetShaderBindingTableRecordIndexEXT:3813case glslang::EOpHitObjectReorderExecuteEXT:3814case glslang::EOpHitObjectTraceReorderExecuteEXT:3815case glslang::EOpHitObjectTraceMotionReorderExecuteEXT:3816if (arg == 0)3817lvalue = true;3818break;38193820case glslang::EOpHitObjectGetLSSPositionsNV:3821case glslang::EOpHitObjectGetLSSRadiiNV:3822lvalue = true;3823break;38243825case glslang::EOpRayQueryInitialize:3826case glslang::EOpRayQueryTerminate:3827case glslang::EOpRayQueryConfirmIntersection:3828case glslang::EOpRayQueryProceed:3829case glslang::EOpRayQueryGenerateIntersection:3830case glslang::EOpRayQueryGetIntersectionType:3831case glslang::EOpRayQueryGetIntersectionT:3832case glslang::EOpRayQueryGetIntersectionInstanceCustomIndex:3833case glslang::EOpRayQueryGetIntersectionInstanceId:3834case glslang::EOpRayQueryGetIntersectionInstanceShaderBindingTableRecordOffset:3835case glslang::EOpRayQueryGetIntersectionGeometryIndex:3836case glslang::EOpRayQueryGetIntersectionPrimitiveIndex:3837case glslang::EOpRayQueryGetIntersectionBarycentrics:3838case glslang::EOpRayQueryGetIntersectionFrontFace:3839case glslang::EOpRayQueryGetIntersectionObjectRayDirection:3840case glslang::EOpRayQueryGetIntersectionObjectRayOrigin:3841case glslang::EOpRayQueryGetIntersectionObjectToWorld:3842case glslang::EOpRayQueryGetIntersectionWorldToObject:3843case glslang::EOpRayQueryGetIntersectionClusterIdNV:3844case glslang::EOpRayQueryGetIntersectionSpherePositionNV:3845case glslang::EOpRayQueryGetIntersectionSphereRadiusNV:3846case glslang::EOpRayQueryGetIntersectionLSSHitValueNV:3847case glslang::EOpRayQueryIsSphereHitNV:3848case glslang::EOpRayQueryIsLSSHitNV:3849if (arg == 0)3850lvalue = true;3851break;38523853case glslang::EOpAtomicAdd:3854case glslang::EOpAtomicSubtract:3855case glslang::EOpAtomicMin:3856case glslang::EOpAtomicMax:3857case glslang::EOpAtomicAnd:3858case glslang::EOpAtomicOr:3859case glslang::EOpAtomicXor:3860case 
glslang::EOpAtomicExchange:3861case glslang::EOpAtomicCompSwap:3862if (arg == 0)3863lvalue = true;3864break;38653866case glslang::EOpFrexp:3867if (arg == 1)3868lvalue = true;3869break;3870case glslang::EOpInterpolateAtSample:3871case glslang::EOpInterpolateAtOffset:3872case glslang::EOpInterpolateAtVertex:3873if (arg == 0) {3874// If GLSL, use the address of the interpolant argument.3875// If HLSL, use an internal version of OpInterolates that takes3876// the rvalue of the interpolant. A fixup pass in spirv-opt3877// legalization will remove the OpLoad and convert to an lvalue.3878// Had to do this because legalization will only propagate a3879// builtin into an rvalue.3880lvalue = glslangIntermediate->getSource() != glslang::EShSourceHlsl;38813882// Does it need a swizzle inversion? If so, evaluation is inverted;3883// operate first on the swizzle base, then apply the swizzle.3884// That is, we transform3885//3886// interpolate(v.zy) -> interpolate(v).zy3887//3888if (glslangOperands[0]->getAsOperator() &&3889glslangOperands[0]->getAsOperator()->getOp() == glslang::EOpVectorSwizzle)3890invertedType = convertGlslangToSpvType(3891glslangOperands[0]->getAsBinaryNode()->getLeft()->getType());3892}3893break;3894case glslang::EOpAtomicLoad:3895case glslang::EOpAtomicStore:3896case glslang::EOpAtomicCounterAdd:3897case glslang::EOpAtomicCounterSubtract:3898case glslang::EOpAtomicCounterMin:3899case glslang::EOpAtomicCounterMax:3900case glslang::EOpAtomicCounterAnd:3901case glslang::EOpAtomicCounterOr:3902case glslang::EOpAtomicCounterXor:3903case glslang::EOpAtomicCounterExchange:3904case glslang::EOpAtomicCounterCompSwap:3905if (arg == 0)3906lvalue = true;3907break;3908case glslang::EOpAddCarry:3909case glslang::EOpSubBorrow:3910if (arg == 2)3911lvalue = true;3912break;3913case glslang::EOpUMulExtended:3914case glslang::EOpIMulExtended:3915if (arg >= 2)3916lvalue = true;3917break;3918case glslang::EOpCooperativeMatrixLoad:3919case 
glslang::EOpCooperativeMatrixLoadNV:3920case glslang::EOpCooperativeMatrixLoadTensorNV:3921case glslang::EOpCooperativeVectorLoadNV:3922if (arg == 0 || arg == 1)3923lvalue = true;3924break;3925case glslang::EOpCooperativeMatrixStore:3926case glslang::EOpCooperativeMatrixStoreNV:3927case glslang::EOpCooperativeMatrixStoreTensorNV:3928case glslang::EOpCooperativeVectorStoreNV:3929if (arg == 1)3930lvalue = true;3931break;3932case glslang::EOpCooperativeVectorMatMulNV:3933if (arg == 0 || arg == 3)3934lvalue = true;3935break;3936case glslang::EOpCooperativeVectorMatMulAddNV:3937if (arg == 0 || arg == 3 || arg == 6)3938lvalue = true;3939break;3940case glslang::EOpCooperativeVectorOuterProductAccumulateNV:3941if (arg == 2)3942lvalue = true;3943break;3944case glslang::EOpCooperativeVectorReduceSumAccumulateNV:3945if (arg == 1)3946lvalue = true;3947break;3948case glslang::EOpCooperativeMatrixReduceNV:3949case glslang::EOpCooperativeMatrixPerElementOpNV:3950case glslang::EOpCooperativeMatrixTransposeNV:3951if (arg == 0)3952lvalue = true;3953break;3954case glslang::EOpSpirvInst:3955if (glslangOperands[arg]->getAsTyped()->getQualifier().isSpirvByReference())3956lvalue = true;3957break;3958case glslang::EOpReorderThreadNV:3959case glslang::EOpReorderThreadEXT:3960//Three variants of reorderThreadNV, two of them use hitObjectNV3961if (arg == 0 && glslangOperands.size() != 2)3962lvalue = true;3963break;3964case glslang::EOpRayQueryGetIntersectionTriangleVertexPositionsEXT:3965case glslang::EOpRayQueryGetIntersectionLSSPositionsNV:3966case glslang::EOpRayQueryGetIntersectionLSSRadiiNV:3967if (arg == 0 || arg == 2)3968lvalue = true;3969break;3970case glslang::EOpTensorReadARM:3971if (arg == 2)3972lvalue = true;3973break;3974default:3975break;3976}3977builder.clearAccessChain();3978if (invertedType != spv::NoType && arg == 0)3979glslangOperands[0]->getAsBinaryNode()->getLeft()->traverse(this);3980else3981glslangOperands[arg]->traverse(this);39823983bool isCoopMat = node->getOp() == 
glslang::EOpCooperativeMatrixLoad ||3984node->getOp() == glslang::EOpCooperativeMatrixStore ||3985node->getOp() == glslang::EOpCooperativeMatrixLoadNV ||3986node->getOp() == glslang::EOpCooperativeMatrixStoreNV ||3987node->getOp() == glslang::EOpCooperativeMatrixLoadTensorNV ||3988node->getOp() == glslang::EOpCooperativeMatrixStoreTensorNV;3989bool isCoopVec = node->getOp() == glslang::EOpCooperativeVectorLoadNV ||3990node->getOp() == glslang::EOpCooperativeVectorStoreNV;3991if (isCoopMat || isCoopVec) {39923993if (arg == 1) {3994spv::Builder::AccessChain::CoherentFlags coherentFlags {};3995unsigned int alignment {};3996if (isCoopMat) {3997// fold "element" parameter into the access chain3998spv::Builder::AccessChain save = builder.getAccessChain();3999builder.clearAccessChain();4000glslangOperands[2]->traverse(this);40014002spv::Id elementId = accessChainLoad(glslangOperands[2]->getAsTyped()->getType());40034004builder.setAccessChain(save);40054006// Point to the first element of the array.4007builder.accessChainPush(elementId,4008TranslateCoherent(glslangOperands[arg]->getAsTyped()->getType()),4009glslangOperands[arg]->getAsTyped()->getType().getBufferReferenceAlignment());4010coherentFlags = builder.getAccessChain().coherentFlags;4011alignment = builder.getAccessChain().alignment;4012} else {4013coherentFlags = builder.getAccessChain().coherentFlags;4014coherentFlags |= TranslateCoherent(glslangOperands[arg]->getAsTyped()->getType());4015alignment = 16;4016}40174018spv::MemoryAccessMask memoryAccess = TranslateMemoryAccess(coherentFlags);4019if (node->getOp() == glslang::EOpCooperativeMatrixLoad ||4020node->getOp() == glslang::EOpCooperativeMatrixLoadNV ||4021node->getOp() == glslang::EOpCooperativeMatrixLoadTensorNV ||4022node->getOp() == glslang::EOpCooperativeVectorLoadNV)4023memoryAccess = (memoryAccess & ~spv::MemoryAccessMask::MakePointerAvailableKHR);4024if (node->getOp() == glslang::EOpCooperativeMatrixStore ||4025node->getOp() == 
glslang::EOpCooperativeMatrixStoreNV ||4026node->getOp() == glslang::EOpCooperativeMatrixStoreTensorNV ||4027node->getOp() == glslang::EOpCooperativeVectorStoreNV)4028memoryAccess = (memoryAccess & ~spv::MemoryAccessMask::MakePointerVisibleKHR);4029if (builder.getStorageClass(builder.getAccessChain().base) ==4030spv::StorageClass::PhysicalStorageBufferEXT) {4031memoryAccess = (spv::MemoryAccessMask)(memoryAccess | spv::MemoryAccessMask::Aligned);4032}40334034memoryAccessOperands.push_back(spv::IdImmediate(false, memoryAccess));40354036if (anySet(memoryAccess, spv::MemoryAccessMask::Aligned)) {4037memoryAccessOperands.push_back(spv::IdImmediate(false, alignment));4038}40394040if (anySet(memoryAccess,4041spv::MemoryAccessMask::MakePointerAvailableKHR | spv::MemoryAccessMask::MakePointerVisibleKHR)) {4042memoryAccessOperands.push_back(spv::IdImmediate(true,4043builder.makeUintConstant(TranslateMemoryScope(coherentFlags))));4044}4045} else if (isCoopMat && arg == 2) {4046continue;4047}4048}40494050// for l-values, pass the address, for r-values, pass the value4051if (lvalue) {4052if (invertedType == spv::NoType && !builder.isSpvLvalue()) {4053// SPIR-V cannot represent an l-value containing a swizzle that doesn't4054// reduce to a simple access chain. 
So, we need a temporary vector to4055// receive the result, and must later swizzle that into the original4056// l-value.4057complexLvalues.push_back(builder.getAccessChain());4058temporaryLvalues.push_back(builder.createVariable(4059spv::NoPrecision, spv::StorageClass::Function,4060builder.accessChainGetInferredType(), "swizzleTemp"));4061operands.push_back(temporaryLvalues.back());4062} else {4063operands.push_back(builder.accessChainGetLValue());4064}4065lvalueCoherentFlags = builder.getAccessChain().coherentFlags;4066lvalueCoherentFlags |= TranslateCoherent(glslangOperands[arg]->getAsTyped()->getType());4067} else {4068builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());4069glslang::TOperator glslangOp = node->getOp();4070if (arg == 1 &&4071(glslangOp == glslang::EOpRayQueryGetIntersectionType ||4072glslangOp == glslang::EOpRayQueryGetIntersectionT ||4073glslangOp == glslang::EOpRayQueryGetIntersectionInstanceCustomIndex ||4074glslangOp == glslang::EOpRayQueryGetIntersectionInstanceId ||4075glslangOp == glslang::EOpRayQueryGetIntersectionInstanceShaderBindingTableRecordOffset ||4076glslangOp == glslang::EOpRayQueryGetIntersectionGeometryIndex ||4077glslangOp == glslang::EOpRayQueryGetIntersectionPrimitiveIndex ||4078glslangOp == glslang::EOpRayQueryGetIntersectionBarycentrics ||4079glslangOp == glslang::EOpRayQueryGetIntersectionFrontFace ||4080glslangOp == glslang::EOpRayQueryGetIntersectionObjectRayDirection ||4081glslangOp == glslang::EOpRayQueryGetIntersectionObjectRayOrigin ||4082glslangOp == glslang::EOpRayQueryGetIntersectionObjectToWorld ||4083glslangOp == glslang::EOpRayQueryGetIntersectionWorldToObject ||4084glslangOp == glslang::EOpRayQueryGetIntersectionTriangleVertexPositionsEXT ||4085glslangOp == glslang::EOpRayQueryGetIntersectionClusterIdNV ||4086glslangOp == glslang::EOpRayQueryGetIntersectionSpherePositionNV ||4087glslangOp == glslang::EOpRayQueryGetIntersectionSphereRadiusNV ||4088glslangOp == 
glslang::EOpRayQueryGetIntersectionLSSHitValueNV ||4089glslangOp == glslang::EOpRayQueryGetIntersectionLSSPositionsNV ||4090glslangOp == glslang::EOpRayQueryGetIntersectionLSSRadiiNV ||4091glslangOp == glslang::EOpRayQueryIsLSSHitNV ||4092glslangOp == glslang::EOpRayQueryIsSphereHitNV4093)) {4094bool cond = glslangOperands[arg]->getAsConstantUnion()->getConstArray()[0].getBConst();4095operands.push_back(builder.makeIntConstant(cond ? 1 : 0));4096} else if ((arg == 10 && glslangOp == glslang::EOpTraceKHR) ||4097(arg == 11 && glslangOp == glslang::EOpTraceRayMotionNV) ||4098(arg == 1 && glslangOp == glslang::EOpExecuteCallableKHR) ||4099(arg == 1 && glslangOp == glslang::EOpHitObjectExecuteShaderNV) ||4100(arg == 1 && glslangOp == glslang::EOpHitObjectExecuteShaderEXT) ||4101(arg == 11 && glslangOp == glslang::EOpHitObjectTraceRayNV) ||4102(arg == 11 && glslangOp == glslang::EOpHitObjectTraceRayEXT) ||4103(arg == 12 && glslangOp == glslang::EOpHitObjectTraceRayMotionNV) ||4104(arg == 12 && glslangOp == glslang::EOpHitObjectTraceRayMotionEXT) ||4105(arg == 12 && glslangOp == glslang::EOpHitObjectTraceMotionReorderExecuteEXT && glslangOperands.size() == 13) ||4106(arg == 14 && glslangOp == glslang::EOpHitObjectTraceMotionReorderExecuteEXT && glslangOperands.size() == 15) ||4107(arg == 11 && glslangOp == glslang::EOpHitObjectTraceReorderExecuteEXT && glslangOperands.size() == 12) ||4108(arg == 13 && glslangOp == glslang::EOpHitObjectTraceReorderExecuteEXT && glslangOperands.size() == 14) ||4109(arg == 1 && glslangOp == glslang::EOpHitObjectReorderExecuteEXT && glslangOperands.size() == 2) ||4110(arg == 3 && glslangOp == glslang::EOpHitObjectReorderExecuteEXT && glslangOperands.size() == 4)) {4111const int set = glslangOp == glslang::EOpExecuteCallableKHR ? 
1 : 0;4112const int location = glslangOperands[arg]->getAsConstantUnion()->getConstArray()[0].getUConst();4113auto itNode = locationToSymbol[set].find(location);4114visitSymbol(itNode->second);4115spv::Id symId = getSymbolId(itNode->second);4116operands.push_back(symId);4117} else if ((arg == 12 && glslangOp == glslang::EOpHitObjectRecordHitNV) ||4118(arg == 13 && glslangOp == glslang::EOpHitObjectRecordHitMotionNV) ||4119(arg == 11 && glslangOp == glslang::EOpHitObjectRecordHitWithIndexNV) ||4120(arg == 12 && glslangOp == glslang::EOpHitObjectRecordHitWithIndexMotionNV) ||4121(arg == 3 && glslangOp == glslang::EOpHitObjectRecordFromQueryEXT) ||4122(arg == 1 && glslangOp == glslang::EOpHitObjectGetAttributesEXT) ||4123(arg == 1 && glslangOp == glslang::EOpHitObjectGetAttributesNV)) {4124const int location = glslangOperands[arg]->getAsConstantUnion()->getConstArray()[0].getUConst();4125const int set = 2;4126auto itNode = locationToSymbol[set].find(location);4127visitSymbol(itNode->second);4128spv::Id symId = getSymbolId(itNode->second);4129operands.push_back(symId);4130} else if (glslangOperands[arg]->getAsTyped()->getQualifier().isSpirvLiteral()) {4131// Will be translated to a literal value, make a placeholder here4132operands.push_back(spv::NoResult);4133} else if (glslangOperands[arg]->getAsTyped()->getBasicType() == glslang::EbtFunction) {4134spv::Function* function = functionMap[glslangOperands[arg]->getAsSymbolNode()->getMangledName().c_str()];4135assert(function);4136operands.push_back(function->getId());4137} else {4138operands.push_back(accessChainLoad(glslangOperands[arg]->getAsTyped()->getType()));4139}4140}4141}41424143builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());4144if (node->getOp() == glslang::EOpCooperativeMatrixLoadTensorNV) {4145std::vector<spv::IdImmediate> 
idImmOps;41464147builder.addCapability(spv::Capability::CooperativeMatrixTensorAddressingNV);4148builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);41494150spv::Id object = builder.createLoad(operands[0], spv::NoPrecision);41514152idImmOps.push_back(spv::IdImmediate(true, operands[1])); // Pointer4153idImmOps.push_back(spv::IdImmediate(true, object)); // Object4154idImmOps.push_back(spv::IdImmediate(true, operands[2])); // tensorLayout41554156idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end()); // memoryaccess41574158// initialize tensor operands to zero, then OR in flags based on the operands4159size_t tensorOpIdx = idImmOps.size();4160idImmOps.push_back(spv::IdImmediate(false, 0));41614162for (uint32_t i = 3; i < operands.size(); ++i) {4163if (builder.isTensorView(operands[i])) {4164addMask(idImmOps[tensorOpIdx].word, spv::TensorAddressingOperandsMask::TensorView);4165} else {4166// must be the decode func4167addMask(idImmOps[tensorOpIdx].word, spv::TensorAddressingOperandsMask::DecodeFunc);4168builder.addCapability(spv::Capability::CooperativeMatrixBlockLoadsNV);4169}4170idImmOps.push_back(spv::IdImmediate(true, operands[i])); // tensorView or decodeFunc4171}41724173// get the pointee type4174spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));4175assert(builder.isCooperativeMatrixType(typeId));4176// do the op4177spv::Id result = builder.createOp(spv::Op::OpCooperativeMatrixLoadTensorNV, typeId, idImmOps);4178// store the result to the pointer (out param 'm')4179builder.createStore(result, operands[0]);4180result = 0;4181} else if (node->getOp() == glslang::EOpCooperativeMatrixLoad ||4182node->getOp() == glslang::EOpCooperativeMatrixLoadNV) {4183std::vector<spv::IdImmediate> idImmOps;41844185idImmOps.push_back(spv::IdImmediate(true, operands[1])); // buf4186if (node->getOp() == glslang::EOpCooperativeMatrixLoad) {4187idImmOps.push_back(spv::IdImmediate(true, operands[3])); // 
matrixLayout4188auto layout = (spv::CooperativeMatrixLayout)builder.getConstantScalar(operands[3]);4189if (layout == spv::CooperativeMatrixLayout::RowBlockedInterleavedARM ||4190layout == spv::CooperativeMatrixLayout::ColumnBlockedInterleavedARM) {4191builder.addExtension(spv::E_SPV_ARM_cooperative_matrix_layouts);4192builder.addCapability(spv::Capability::CooperativeMatrixLayoutsARM);4193}4194idImmOps.push_back(spv::IdImmediate(true, operands[2])); // stride4195} else {4196idImmOps.push_back(spv::IdImmediate(true, operands[2])); // stride4197idImmOps.push_back(spv::IdImmediate(true, operands[3])); // colMajor4198}4199idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end());4200// get the pointee type4201spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));4202assert(builder.isCooperativeMatrixType(typeId));4203// do the op4204spv::Id result = node->getOp() == glslang::EOpCooperativeMatrixLoad4205? builder.createOp(spv::Op::OpCooperativeMatrixLoadKHR, typeId, idImmOps)4206: builder.createOp(spv::Op::OpCooperativeMatrixLoadNV, typeId, idImmOps);4207// store the result to the pointer (out param 'm')4208builder.createStore(result, operands[0]);4209result = 0;4210} else if (node->getOp() == glslang::EOpCooperativeMatrixStoreTensorNV) {4211std::vector<spv::IdImmediate> idImmOps;42124213idImmOps.push_back(spv::IdImmediate(true, operands[1])); // buf4214idImmOps.push_back(spv::IdImmediate(true, operands[0])); // object42154216builder.addCapability(spv::Capability::CooperativeMatrixTensorAddressingNV);4217builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);42184219idImmOps.push_back(spv::IdImmediate(true, operands[2])); // tensorLayout42204221idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end()); // memoryaccess42224223if (operands.size() > 3) {4224idImmOps.push_back(spv::IdImmediate(false, 
spv::TensorAddressingOperandsMask::TensorView));4225idImmOps.push_back(spv::IdImmediate(true, operands[3])); // tensorView4226} else {4227idImmOps.push_back(spv::IdImmediate(false, 0));4228}42294230builder.createNoResultOp(spv::Op::OpCooperativeMatrixStoreTensorNV, idImmOps);4231result = 0;4232} else if (node->getOp() == glslang::EOpCooperativeMatrixStore ||4233node->getOp() == glslang::EOpCooperativeMatrixStoreNV) {4234std::vector<spv::IdImmediate> idImmOps;42354236idImmOps.push_back(spv::IdImmediate(true, operands[1])); // buf4237idImmOps.push_back(spv::IdImmediate(true, operands[0])); // object4238if (node->getOp() == glslang::EOpCooperativeMatrixStore) {4239idImmOps.push_back(spv::IdImmediate(true, operands[3])); // matrixLayout4240auto layout = (spv::CooperativeMatrixLayout)builder.getConstantScalar(operands[3]);4241if (layout == spv::CooperativeMatrixLayout::RowBlockedInterleavedARM ||4242layout == spv::CooperativeMatrixLayout::ColumnBlockedInterleavedARM) {4243builder.addExtension(spv::E_SPV_ARM_cooperative_matrix_layouts);4244builder.addCapability(spv::Capability::CooperativeMatrixLayoutsARM);4245}4246idImmOps.push_back(spv::IdImmediate(true, operands[2])); // stride4247} else {4248idImmOps.push_back(spv::IdImmediate(true, operands[2])); // stride4249idImmOps.push_back(spv::IdImmediate(true, operands[3])); // colMajor4250}4251idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end());42524253if (node->getOp() == glslang::EOpCooperativeMatrixStore)4254builder.createNoResultOp(spv::Op::OpCooperativeMatrixStoreKHR, idImmOps);4255else4256builder.createNoResultOp(spv::Op::OpCooperativeMatrixStoreNV, idImmOps);4257result = 0;4258} else if (node->getOp() == glslang::EOpRayQueryGetIntersectionTriangleVertexPositionsEXT) {4259std::vector<spv::IdImmediate> idImmOps;42604261idImmOps.push_back(spv::IdImmediate(true, operands[0])); // q4262idImmOps.push_back(spv::IdImmediate(true, operands[1])); // committed42634264spv::Id typeId = 
builder.makeArrayType(builder.makeVectorType(builder.makeFloatType(32), 3),4265builder.makeUintConstant(3), 0);4266// do the op42674268spv::Op spvOp = spv::Op::OpRayQueryGetIntersectionTriangleVertexPositionsKHR;42694270spv::Id result = builder.createOp(spvOp, typeId, idImmOps);4271// store the result to the pointer (out param 'm')4272builder.createStore(result, operands[2]);4273result = 0;4274} else if (node->getOp() == glslang::EOpRayQueryGetIntersectionLSSPositionsNV) {4275std::vector<spv::IdImmediate> idImmOps;42764277idImmOps.push_back(spv::IdImmediate(true, operands[0])); // q4278idImmOps.push_back(spv::IdImmediate(true, operands[1])); // committed42794280spv::Id typeId = builder.makeArrayType(builder.makeVectorType(builder.makeFloatType(32), 3),4281builder.makeUintConstant(2), 0);4282// do the op42834284spv::Op spvOp = spv::Op::OpRayQueryGetIntersectionLSSPositionsNV;42854286spv::Id result = builder.createOp(spvOp, typeId, idImmOps);4287// store the result to the pointer (out param 'm')4288builder.createStore(result, operands[2]);4289result = 0;4290} else if (node->getOp() == glslang::EOpRayQueryGetIntersectionLSSRadiiNV) {4291std::vector<spv::IdImmediate> idImmOps;42924293idImmOps.push_back(spv::IdImmediate(true, operands[0])); // q4294idImmOps.push_back(spv::IdImmediate(true, operands[1])); // committed42954296spv::Id typeId = builder.makeArrayType(builder.makeFloatType(32),4297builder.makeUintConstant(2), 0);4298// do the op42994300spv::Op spvOp = spv::Op::OpRayQueryGetIntersectionLSSRadiiNV;43014302spv::Id result = builder.createOp(spvOp, typeId, idImmOps);4303// store the result to the pointer (out param 'm')4304builder.createStore(result, operands[2]);4305result = 0;4306} else if (node->getOp() == glslang::EOpHitObjectGetLSSPositionsNV) {4307std::vector<spv::IdImmediate> idImmOps;43084309idImmOps.push_back(spv::IdImmediate(true, operands[0])); // hitObject43104311spv::Op spvOp = spv::Op::OpHitObjectGetLSSPositionsNV;4312spv::Id typeId = 
builder.makeArrayType(builder.makeVectorType(builder.makeFloatType(32), 3),4313builder.makeUintConstant(2), 0);43144315spv::Id result = builder.createOp(spvOp, typeId, idImmOps);4316// store the result to the pointer (out param 'm')4317builder.createStore(result, operands[1]);4318result = 0;4319} else if (node->getOp() == glslang::EOpHitObjectGetLSSRadiiNV) {4320std::vector<spv::IdImmediate> idImmOps;43214322idImmOps.push_back(spv::IdImmediate(true, operands[0])); // hitObject43234324spv::Op spvOp = spv::Op::OpHitObjectGetLSSRadiiNV;4325spv::Id typeId = builder.makeArrayType(builder.makeFloatType(32),4326builder.makeUintConstant(2), 0);43274328spv::Id result = builder.createOp(spvOp, typeId, idImmOps);4329// store the result to the pointer (out param 'm')4330builder.createStore(result, operands[1]);4331result = 0;4332} else if (node->getOp() == glslang::EOpHitObjectGetIntersectionTriangleVertexPositionsEXT) {4333std::vector<spv::IdImmediate> idImmOps;43344335idImmOps.push_back(spv::IdImmediate(true, operands[0])); // hitObject43364337spv::Op spvOp = spv::Op::OpHitObjectGetIntersectionTriangleVertexPositionsEXT;4338spv::Id typeId = builder.makeArrayType(builder.makeVectorType(builder.makeFloatType(32), 3),4339builder.makeUintConstant(3), 0);43404341spv::Id result = builder.createOp(spvOp, typeId, idImmOps);4342// store the result to the pointer (out param 'm')4343builder.createStore(result, operands[1]);4344result = 0;4345} else if (node->getOp() == glslang::EOpCooperativeMatrixMulAdd) {4346auto matrixOperands = spv::CooperativeMatrixOperandsMask::MaskNone;43474348// If the optional operand is present, initialize matrixOperands to that value.4349if (glslangOperands.size() == 4 && glslangOperands[3]->getAsConstantUnion()) {4350matrixOperands = (spv::CooperativeMatrixOperandsMask)glslangOperands[3]->getAsConstantUnion()->getConstArray()[0].getIConst();4351}43524353// Determine Cooperative Matrix Operands bits from the signedness of the types.4354if 
(isTypeSignedInt(glslangOperands[0]->getAsTyped()->getBasicType()))4355addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixASignedComponentsKHR);4356if (isTypeSignedInt(glslangOperands[1]->getAsTyped()->getBasicType()))4357addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixBSignedComponentsKHR);4358if (isTypeSignedInt(glslangOperands[2]->getAsTyped()->getBasicType()))4359addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixCSignedComponentsKHR);4360if (isTypeSignedInt(node->getBasicType()))4361addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixResultSignedComponentsKHR);43624363std::vector<spv::IdImmediate> idImmOps;4364idImmOps.push_back(spv::IdImmediate(true, operands[0]));4365idImmOps.push_back(spv::IdImmediate(true, operands[1]));4366idImmOps.push_back(spv::IdImmediate(true, operands[2]));4367if (matrixOperands != spv::CooperativeMatrixOperandsMask::MaskNone)4368idImmOps.push_back(spv::IdImmediate(false, matrixOperands));43694370result = builder.createOp(spv::Op::OpCooperativeMatrixMulAddKHR, resultType(), idImmOps);4371} else if (node->getOp() == glslang::EOpCooperativeMatrixReduceNV) {4372builder.addCapability(spv::Capability::CooperativeMatrixReductionsNV);4373builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);43744375spv::Op opcode = spv::Op::OpCooperativeMatrixReduceNV;4376unsigned mask = glslangOperands[2]->getAsConstantUnion()->getConstArray()[0].getUConst();43774378spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));4379assert(builder.isCooperativeMatrixType(typeId));43804381result = builder.createCooperativeMatrixReduce(opcode, typeId, operands[1], mask, operands[3]);4382// store the result to the pointer (out param 'm')4383builder.createStore(result, operands[0]);4384result = 0;4385} else if (node->getOp() == glslang::EOpCooperativeMatrixPerElementOpNV) 
{4386builder.addCapability(spv::Capability::CooperativeMatrixPerElementOperationsNV);4387builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);43884389spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));4390assert(builder.isCooperativeMatrixType(typeId));43914392result = builder.createCooperativeMatrixPerElementOp(typeId, operands);4393// store the result to the pointer4394builder.createStore(result, operands[0]);4395result = 0;4396} else if (node->getOp() == glslang::EOpCooperativeMatrixTransposeNV) {43974398builder.addCapability(spv::Capability::CooperativeMatrixConversionsNV);4399builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);44004401spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));4402assert(builder.isCooperativeMatrixType(typeId));44034404result = builder.createUnaryOp(spv::Op::OpCooperativeMatrixTransposeNV, typeId, operands[1]);4405// store the result to the pointer4406builder.createStore(result, operands[0]);4407result = 0;4408} else if (node->getOp() == glslang::EOpBitCastArrayQCOM) {4409builder.addCapability(spv::Capability::CooperativeMatrixConversionQCOM);4410builder.addExtension(spv::E_SPV_QCOM_cooperative_matrix_conversion);4411result = builder.createUnaryOp(spv::Op::OpBitCastArrayQCOM, resultType(), operands[0]);4412} else if (node->getOp() == glslang::EOpCompositeConstructCoopMatQCOM) {4413builder.addCapability(spv::Capability::CooperativeMatrixConversionQCOM);4414builder.addExtension(spv::E_SPV_QCOM_cooperative_matrix_conversion);4415result = builder.createUnaryOp(spv::Op::OpCompositeConstructCoopMatQCOM, resultType(), operands[0]);4416} else if (node->getOp() == glslang::EOpCompositeExtractCoopMatQCOM) {4417builder.addCapability(spv::Capability::CooperativeMatrixConversionQCOM);4418builder.addExtension(spv::E_SPV_QCOM_cooperative_matrix_conversion);4419result = builder.createUnaryOp(spv::Op::OpCompositeExtractCoopMatQCOM, resultType(), operands[0]);4420} else if (node->getOp() == 
glslang::EOpExtractSubArrayQCOM) {4421builder.addCapability(spv::Capability::CooperativeMatrixConversionQCOM);4422builder.addExtension(spv::E_SPV_QCOM_cooperative_matrix_conversion);44234424std::vector<spv::Id> arguments { operands[0], operands[1] };;4425result = builder.createOp(spv::Op::OpExtractSubArrayQCOM, resultType(), arguments);4426} else if (node->getOp() == glslang::EOpCooperativeVectorMatMulNV ||4427node->getOp() == glslang::EOpCooperativeVectorMatMulAddNV) {4428auto matrixOperands = spv::CooperativeMatrixOperandsMask::MaskNone;44294430bool isMulAdd = node->getOp() == glslang::EOpCooperativeVectorMatMulAddNV;44314432// Determine Cooperative Matrix Operands bits from the signedness of the types.44334434if (isTypeSignedInt(glslangOperands[1]->getAsTyped()->getBasicType()))4435addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixBSignedComponentsKHR);4436if (isTypeSignedInt(glslangOperands[0]->getAsTyped()->getBasicType()))4437addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixResultSignedComponentsKHR);44384439uint32_t opIdx = 1;4440std::vector<spv::IdImmediate> idImmOps;4441idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // Input4442idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // InputInterpretation4443idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // Matrix4444idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // MatrixOffset4445idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // MatrixInterpretation4446if (isMulAdd) {4447idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // Bias4448idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // BiasOffset4449idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // BiasInterpretation4450}4451idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // M4452idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // K4453idImmOps.push_back(spv::IdImmediate(true, 
operands[opIdx++])); // MemoryLayout4454idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // Transpose4455idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // MatrixStride4456if (matrixOperands != spv::CooperativeMatrixOperandsMask::MaskNone)4457idImmOps.push_back(spv::IdImmediate(false, matrixOperands)); // Cooperative Matrix Operands44584459// get the pointee type4460spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));4461assert(builder.isCooperativeVectorType(typeId));4462// do the op4463spv::Id result = builder.createOp(isMulAdd ? spv::Op::OpCooperativeVectorMatrixMulAddNV : spv::Op::OpCooperativeVectorMatrixMulNV, typeId, idImmOps);4464// store the result to the pointer (out param 'res')4465builder.createStore(result, operands[0]);4466result = 0;4467} else if (node->getOp() == glslang::EOpCooperativeVectorLoadNV) {4468std::vector<spv::IdImmediate> idImmOps;44694470idImmOps.push_back(spv::IdImmediate(true, operands[1])); // buf4471idImmOps.push_back(spv::IdImmediate(true, operands[2])); // offset4472idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end());4473// get the pointee type4474spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));4475assert(builder.isCooperativeVectorType(typeId));4476// do the op4477spv::Id result = builder.createOp(spv::Op::OpCooperativeVectorLoadNV, typeId, idImmOps);4478// store the result to the pointer (out param 'v')4479builder.createStore(result, operands[0]);4480result = 0;4481} else if (node->getOp() == glslang::EOpCooperativeVectorStoreNV) {4482std::vector<spv::IdImmediate> idImmOps;44834484idImmOps.push_back(spv::IdImmediate(true, operands[1])); // buf4485idImmOps.push_back(spv::IdImmediate(true, operands[2])); // offset4486idImmOps.push_back(spv::IdImmediate(true, operands[0])); // object4487idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), 
memoryAccessOperands.end());4488builder.createNoResultOp(spv::Op::OpCooperativeVectorStoreNV, idImmOps);4489result = 0;4490} else if (node->getOp() == glslang::EOpCooperativeVectorOuterProductAccumulateNV) {4491builder.addCapability(spv::Capability::CooperativeVectorTrainingNV);4492builder.addExtension(spv::E_SPV_NV_cooperative_vector);44934494std::vector<spv::IdImmediate> idImmOps;44954496idImmOps.push_back(spv::IdImmediate(true, operands[2])); // Matrix4497idImmOps.push_back(spv::IdImmediate(true, operands[3])); // Offset4498idImmOps.push_back(spv::IdImmediate(true, operands[0])); // A4499idImmOps.push_back(spv::IdImmediate(true, operands[1])); // B4500idImmOps.push_back(spv::IdImmediate(true, operands[5])); // MemoryLayout4501idImmOps.push_back(spv::IdImmediate(true, operands[6])); // MatrixInterpretation4502idImmOps.push_back(spv::IdImmediate(true, operands[4])); // Stride4503builder.createNoResultOp(spv::Op::OpCooperativeVectorOuterProductAccumulateNV, idImmOps);4504result = 0;4505} else if (node->getOp() == glslang::EOpCooperativeVectorReduceSumAccumulateNV) {4506builder.addCapability(spv::Capability::CooperativeVectorTrainingNV);4507builder.addExtension(spv::E_SPV_NV_cooperative_vector);45084509std::vector<spv::IdImmediate> idImmOps;45104511idImmOps.push_back(spv::IdImmediate(true, operands[1])); // Buf4512idImmOps.push_back(spv::IdImmediate(true, operands[2])); // Offset4513idImmOps.push_back(spv::IdImmediate(true, operands[0])); // A4514builder.createNoResultOp(spv::Op::OpCooperativeVectorReduceSumAccumulateNV, idImmOps);4515result = 0;4516} else if (node->getOp() == glslang::EOpTensorReadARM ||4517node->getOp() == glslang::EOpTensorWriteARM) {4518const bool isWrite = node->getOp() == glslang::EOpTensorWriteARM;4519const unsigned int tensorMinOperandCount = 3;4520assert(operands.size() >= tensorMinOperandCount);4521std::vector<spv::IdImmediate> idImmOps;45224523idImmOps.push_back(spv::IdImmediate(true, operands[0])); // 
tensor4524idImmOps.push_back(spv::IdImmediate(true, operands[1])); // coords4525if (isWrite) {4526idImmOps.push_back(spv::IdImmediate(true, operands[2])); // value4527}45284529// Analyze the tensor operands4530spv::IdImmediate tensorOperands = { false, uint32_t(spv::TensorOperandsMask::MaskNone) };4531bool pushExtraArg = false;4532if (operands.size() > tensorMinOperandCount) {4533auto enumVal = builder.getConstantScalar(operands[tensorMinOperandCount]);45344535if (enumVal & uint32_t(spv::TensorOperandsMask::NontemporalARM)) {4536tensorOperands.word |= uint32_t(spv::TensorOperandsMask::NontemporalARM);4537}4538if (enumVal & uint32_t(spv::TensorOperandsMask::OutOfBoundsValueARM)) {4539tensorOperands.word |= uint32_t(spv::TensorOperandsMask::OutOfBoundsValueARM);4540assert(operands.size() >= tensorMinOperandCount + 2 &&4541"TensorOperandsOutOfBoundsValueMask requires an additional value");4542pushExtraArg = true;4543}4544}45454546// Append optional tensor operands if the mask was non-zero.4547if (tensorOperands.word) {4548idImmOps.push_back(tensorOperands);4549if (pushExtraArg)4550idImmOps.push_back(spv::IdImmediate(true, operands[tensorMinOperandCount + 1]));4551}45524553if (isWrite) {4554builder.createNoResultOp(spv::Op::OpTensorWriteARM, idImmOps);4555result = 0;4556} else {4557// Use the result argument type as the OpTensorReadARM result type.4558const glslang::TType &resArgType = glslangOperands[2]->getAsTyped()->getType();4559spv::Id retType = convertGlslangToSpvType(resArgType);4560result = builder.createOp(spv::Op::OpTensorReadARM, retType, idImmOps);4561// Store the result to the result argument.4562builder.createStore(result, operands[2]);4563}4564} else if (node->getOp() == glslang::EOpTensorSizeARM) {4565// Expected operands are (tensor, dimension)4566assert(operands.size() == 2);45674568spv::Id tensorOp = operands[0];4569spv::Id dimOp = operands[1];4570assert(builder.isTensorTypeARM(builder.getTypeId(tensorOp)) && "operand #0 must be a 
tensor");45714572std::vector<spv::IdImmediate> idImmOps;4573idImmOps.push_back(spv::IdImmediate(true, tensorOp));4574idImmOps.push_back(spv::IdImmediate(true, dimOp));4575result = builder.createOp(spv::Op::OpTensorQuerySizeARM, resultType(), idImmOps);4576} else if (atomic) {4577// Handle all atomics4578glslang::TBasicType typeProxy = (node->getOp() == glslang::EOpAtomicStore)4579? node->getSequence()[0]->getAsTyped()->getBasicType() : node->getBasicType();4580result = createAtomicOperation(node->getOp(), precision, resultType(), operands, typeProxy,4581lvalueCoherentFlags, node->getType());4582} else if (node->getOp() == glslang::EOpSpirvInst) {4583const auto& spirvInst = node->getSpirvInstruction();4584if (spirvInst.set == "") {4585std::vector<spv::IdImmediate> idImmOps;4586for (unsigned int i = 0; i < glslangOperands.size(); ++i) {4587if (glslangOperands[i]->getAsTyped()->getQualifier().isSpirvLiteral()) {4588// Translate the constant to a literal value4589std::vector<unsigned> literals;4590glslang::TVector<const glslang::TIntermConstantUnion*> constants;4591constants.push_back(glslangOperands[i]->getAsConstantUnion());4592TranslateLiterals(constants, literals);4593idImmOps.push_back({false, literals[0]});4594} else4595idImmOps.push_back({true, operands[i]});4596}45974598if (node->getBasicType() == glslang::EbtVoid)4599builder.createNoResultOp(static_cast<spv::Op>(spirvInst.id), idImmOps);4600else4601result = builder.createOp(static_cast<spv::Op>(spirvInst.id), resultType(), idImmOps);4602} else {4603result = builder.createBuiltinCall(4604resultType(), spirvInst.set == "GLSL.std.450" ? 
stdBuiltins : getExtBuiltins(spirvInst.set.c_str()),4605spirvInst.id, operands);4606}4607noReturnValue = node->getBasicType() == glslang::EbtVoid;4608} else if (node->getOp() == glslang::EOpDebugPrintf) {4609if (!nonSemanticDebugPrintf) {4610nonSemanticDebugPrintf = builder.import("NonSemantic.DebugPrintf");4611}4612result = builder.createBuiltinCall(builder.makeVoidType(), nonSemanticDebugPrintf, spv::NonSemanticDebugPrintfDebugPrintf, operands);4613builder.addExtension(spv::E_SPV_KHR_non_semantic_info);4614} else {4615// Pass through to generic operations.4616switch (glslangOperands.size()) {4617case 0:4618result = createNoArgOperation(node->getOp(), precision, resultType());4619break;4620case 1:4621{4622OpDecorations decorations = { precision,4623TranslateNoContractionDecoration(node->getType().getQualifier()),4624TranslateNonUniformDecoration(node->getType().getQualifier()) };4625result = createUnaryOperation(4626node->getOp(), decorations,4627resultType(), operands.front(),4628glslangOperands[0]->getAsTyped()->getBasicType(), lvalueCoherentFlags, node->getType());4629}4630break;4631default:4632result = createMiscOperation(node->getOp(), precision, resultType(), operands, node->getBasicType());4633break;4634}46354636if (invertedType != spv::NoResult)4637result = createInvertedSwizzle(precision, *glslangOperands[0]->getAsBinaryNode(), result);46384639for (unsigned int i = 0; i < temporaryLvalues.size(); ++i) {4640builder.setAccessChain(complexLvalues[i]);4641builder.accessChainStore(builder.createLoad(temporaryLvalues[i], spv::NoPrecision),4642TranslateNonUniformDecoration(complexLvalues[i].coherentFlags));4643}4644}46454646if (noReturnValue)4647return false;46484649if (! 
// This path handles both if-then-else and ?:
// The if-then-else has a node type of void, while
// ?: has either a void or a non-void node type
//
// Leaving the result, when not void:
// GLSL only has r-values as the result of a ?:, but
// if we have an l-value, that can be more efficient if it will
// become the base of a complex r-value expression, because the
// next layer copies r-values into memory to use the access-chain mechanism
//
// Always returns false; both sides of the selection are traversed explicitly
// from within this function.
bool TGlslangToSpvTraverser::visitSelection(glslang::TVisit /* visit */, glslang::TIntermSelection* node)
{
    // see if OpSelect can handle it
    const auto isOpSelectable = [&]() {
        if (node->getBasicType() == glslang::EbtVoid)
            return false;
        // OpSelect can do all other types starting with SPV 1.4
        if (glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_4) {
            // pre-1.4, only scalars and vectors can be handled
            if ((!node->getType().isScalar() && !node->getType().isVector()))
                return false;
        }
        return true;
    };

    // See if it is simple and safe, or required, to execute both sides.
    // Crucially, side effects must be either semantically required or avoided,
    // and there are performance trade-offs.
    // Return true if required or a good idea (and safe) to execute both sides,
    // false otherwise.
    const auto bothSidesPolicy = [&]() -> bool {
        // do we have both sides?
        if (node->getTrueBlock() == nullptr ||
            node->getFalseBlock() == nullptr)
            return false;

        // required? (unless we write additional code to look for side effects
        // and make performance trade-offs if none are present)
        if (!node->getShortCircuit())
            return true;

        // if not required to execute both, decide based on performance/practicality...

        if (!isOpSelectable())
            return false;

        assert(node->getType() == node->getTrueBlock() ->getAsTyped()->getType() &&
               node->getType() == node->getFalseBlock()->getAsTyped()->getType());

        // return true if a single operand to ? : is okay for OpSelect:
        // only plain symbols and constant-qualified operands are accepted
        const auto operandOkay = [](glslang::TIntermTyped* node) {
            return node->getAsSymbolNode() || node->getType().getQualifier().isConstant();
        };

        return operandOkay(node->getTrueBlock() ->getAsTyped()) &&
               operandOkay(node->getFalseBlock()->getAsTyped());
    };

    spv::Id result = spv::NoResult; // upcoming result selecting between trueValue and falseValue
    // emit the condition before doing anything with selection
    node->getCondition()->traverse(this);
    spv::Id condition = accessChainLoad(node->getCondition()->getType());

    // Find a way of executing both sides and selecting the right result.
    // Leaves the access chain set to the result (r-value for OpSelect,
    // l-value for the control-flow fallback) unless the node is void.
    const auto executeBothSides = [&]() -> void {
        // execute both sides
        spv::Id resultType = convertGlslangToSpvType(node->getType());
        node->getTrueBlock()->traverse(this);
        spv::Id trueValue = accessChainLoad(node->getTrueBlock()->getAsTyped()->getType());
        node->getFalseBlock()->traverse(this);
        spv::Id falseValue = accessChainLoad(node->getFalseBlock()->getAsTyped()->getType());

        builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());

        // done if void
        if (node->getBasicType() == glslang::EbtVoid)
            return;

        // emit code to select between trueValue and falseValue
        // see if OpSelect can handle the result type, and that the SPIR-V types
        // of the inputs match the result type.
        if (isOpSelectable()) {
            // Emit OpSelect for this selection.

            // smear condition to vector, if necessary (AST is always scalar)
            // Before 1.4, smear like for mix(), starting with 1.4, keep it scalar
            if (glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_4 && builder.isVector(trueValue)) {
                condition = builder.smearScalar(spv::NoPrecision, condition,
                                                builder.makeVectorType(builder.makeBoolType(),
                                                                       builder.getNumComponents(trueValue)));
            }

            // If the types do not match, it is because of mismatched decorations on aggregates.
            // Since isOpSelectable only lets aggregates get here for SPIR-V >= 1.4, we can use
            // OpCopyLogical to get matching types.
            if (builder.getTypeId(trueValue) != resultType) {
                trueValue = builder.createUnaryOp(spv::Op::OpCopyLogical, resultType, trueValue);
            }
            if (builder.getTypeId(falseValue) != resultType) {
                falseValue = builder.createUnaryOp(spv::Op::OpCopyLogical, resultType, falseValue);
            }

            // OpSelect
            result = builder.createTriOp(spv::Op::OpSelect, resultType, condition, trueValue, falseValue);

            builder.clearAccessChain();
            builder.setAccessChainRValue(result);
        } else {
            // We need control flow to select the result.
            // TODO: Once SPIR-V OpSelect allows arbitrary types, eliminate this path.
            result = builder.createVariable(TranslatePrecisionDecoration(node->getType()),
                spv::StorageClass::Function, resultType);

            // Selection control:
            const spv::SelectionControlMask control = TranslateSelectionControl(*node);

            // make an "if" based on the value created by the condition
            spv::Builder::If ifBuilder(condition, control, builder);

            // emit the "then" statement
            builder.clearAccessChain();
            builder.setAccessChainLValue(result);
            multiTypeStore(node->getType(), trueValue);

            ifBuilder.makeBeginElse();
            // emit the "else" statement
            builder.clearAccessChain();
            builder.setAccessChainLValue(result);
            multiTypeStore(node->getType(), falseValue);

            // finish off the control flow
            ifBuilder.makeEndIf();

            builder.clearAccessChain();
            builder.setAccessChainLValue(result);
        }
    };

    // Execute the one side needed, as per the condition
    const auto executeOneSide = [&]() {
        // Always emit control flow.
        // A non-void selection gets a Function-storage temporary that each side stores into.
        if (node->getBasicType() != glslang::EbtVoid) {
            result = builder.createVariable(TranslatePrecisionDecoration(node->getType()), spv::StorageClass::Function,
                convertGlslangToSpvType(node->getType()));
        }

        // Selection control:
        const spv::SelectionControlMask control = TranslateSelectionControl(*node);

        // make an "if" based on the value created by the condition
        spv::Builder::If ifBuilder(condition, control, builder);

        // emit the "then" statement
        if (node->getTrueBlock() != nullptr) {
            node->getTrueBlock()->traverse(this);
            if (result != spv::NoResult) {
                spv::Id load = accessChainLoad(node->getTrueBlock()->getAsTyped()->getType());

                builder.clearAccessChain();
                builder.setAccessChainLValue(result);
                multiTypeStore(node->getType(), load);
            }
        }

        if (node->getFalseBlock() != nullptr) {
            ifBuilder.makeBeginElse();
            // emit the "else" statement
            node->getFalseBlock()->traverse(this);
            if (result != spv::NoResult) {
                spv::Id load = accessChainLoad(node->getFalseBlock()->getAsTyped()->getType());

                builder.clearAccessChain();
                builder.setAccessChainLValue(result);
                multiTypeStore(node->getType(), load);
            }
        }

        // finish off the control flow
        ifBuilder.makeEndIf();

        // leave the temporary as the l-value result of the whole selection
        if (result != spv::NoResult) {
            builder.clearAccessChain();
            builder.setAccessChainLValue(result);
        }
    };

    // Try for OpSelect (or a requirement to execute both sides)
    if (bothSidesPolicy()) {
        // The guard records the builder's spec-constant code-gen mode on construction;
        // the mode is switched on here only for spec-constant-qualified results.
        SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
        if (node->getType().getQualifier().isSpecConstant())
            spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
        executeBothSides();
    } else
        executeOneSide();

    return false;
}
false;4854}48554856bool TGlslangToSpvTraverser::visitSwitch(glslang::TVisit /* visit */, glslang::TIntermSwitch* node)4857{4858// emit and get the condition before doing anything with switch4859node->getCondition()->traverse(this);4860spv::Id selector = accessChainLoad(node->getCondition()->getAsTyped()->getType());48614862// Selection control:4863const spv::SelectionControlMask control = TranslateSwitchControl(*node);48644865// browse the children to sort out code segments4866int defaultSegment = -1;4867std::vector<TIntermNode*> codeSegments;4868glslang::TIntermSequence& sequence = node->getBody()->getSequence();4869std::vector<int> caseValues;4870std::vector<int> valueIndexToSegment(sequence.size()); // note: probably not all are used, it is an overestimate4871for (glslang::TIntermSequence::iterator c = sequence.begin(); c != sequence.end(); ++c) {4872TIntermNode* child = *c;4873if (child->getAsBranchNode() && child->getAsBranchNode()->getFlowOp() == glslang::EOpDefault)4874defaultSegment = (int)codeSegments.size();4875else if (child->getAsBranchNode() && child->getAsBranchNode()->getFlowOp() == glslang::EOpCase) {4876valueIndexToSegment[caseValues.size()] = (int)codeSegments.size();4877caseValues.push_back(child->getAsBranchNode()->getExpression()->getAsConstantUnion()4878->getConstArray()[0].getIConst());4879} else4880codeSegments.push_back(child);4881}48824883// handle the case where the last code segment is missing, due to no code4884// statements between the last case and the end of the switch statement4885if ((caseValues.size() && (int)codeSegments.size() == valueIndexToSegment[caseValues.size() - 1]) ||4886(int)codeSegments.size() == defaultSegment)4887codeSegments.push_back(nullptr);48884889// make the switch statement4890std::vector<spv::Block*> segmentBlocks; // returned, as the blocks allocated in the call4891builder.makeSwitch(selector, control, (int)codeSegments.size(), caseValues, valueIndexToSegment, defaultSegment,4892segmentBlocks);48934894// 
// Turn a constant-union node into a SPIR-V constant and leave it as the
// r-value of the current access chain. Nodes qualified as SPIR-V literals
// produce nothing here.
void TGlslangToSpvTraverser::visitConstantUnion(glslang::TIntermConstantUnion* node)
{
    if (node->getQualifier().isSpirvLiteral())
        return; // Translated to a literal value, skip further processing

    // nextConst is the running index into the constant array, starting at the first element
    int nextConst = 0;
    spv::Id constant = createSpvConstantFromConstUnionArray(node->getType(), node->getConstArray(), nextConst, false);

    builder.clearAccessChain();
    builder.setAccessChainRValue(constant);
}

// Translate a glslang loop node.
//
// Two shapes are emitted, chosen by whether the loop tests its condition
// first (and actually has a test):
//   test-first:  head -> test -> (body | merge), body -> continue -> head
//   otherwise:   head -> body -> continue -> (head | merge), or an
//                unconditional back edge to head when there is no test.
// Always returns false: test, body and terminal are traversed explicitly here.
bool TGlslangToSpvTraverser::visitLoop(glslang::TVisit /* visit */, glslang::TIntermLoop* node)
{
    auto blocks = builder.makeNewLoop();
    builder.createBranch(true, &blocks.head);

    // Loop control:
    std::vector<unsigned int> operands;
    const spv::LoopControlMask control = TranslateLoopControl(*node, operands);

    // Spec requires back edges to target header blocks, and every header block
    // must dominate its merge block. Make a header block first to ensure these
    // conditions are met. By definition, it will contain OpLoopMerge, followed
    // by a block-ending branch. But we don't want to put any other body/test
    // instructions in it, since the body/test may have arbitrary instructions,
    // including merges of its own.
    builder.setBuildPoint(&blocks.head);
    builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
    builder.createLoopMerge(&blocks.merge, &blocks.continue_target, control, operands);
    if (node->testFirst() && node->getTest()) {
        // The test gets a block of its own, branched to from the header.
        spv::Block& test = builder.makeNewBlock();
        builder.createBranch(true, &test);

        builder.setBuildPoint(&test);
        node->getTest()->traverse(this);
        spv::Id condition = accessChainLoad(node->getTestExpr()->getType());
        builder.createConditionalBranch(condition, &blocks.body, &blocks.merge);

        builder.setBuildPoint(&blocks.body);
        // While in the body, a `break` exits the loop (see the EOpBreak handling in visitBranch).
        breakForLoop.push(true);
        if (node->getBody())
            node->getBody()->traverse(this);
        builder.createBranch(true, &blocks.continue_target);
        breakForLoop.pop();

        // The terminal expression lives in the continue target, followed by the back edge.
        builder.setBuildPoint(&blocks.continue_target);
        if (node->getTerminal())
            node->getTerminal()->traverse(this);
        builder.createBranch(true, &blocks.head);
    } else {
        builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
        builder.createBranch(true, &blocks.body);

        // While in the body, a `break` exits the loop (see the EOpBreak handling in visitBranch).
        breakForLoop.push(true);
        builder.setBuildPoint(&blocks.body);
        if (node->getBody())
            node->getBody()->traverse(this);
        builder.createBranch(true, &blocks.continue_target);
        breakForLoop.pop();

        // Terminal expression first, then the test (if any), both in the continue target.
        builder.setBuildPoint(&blocks.continue_target);
        if (node->getTerminal())
            node->getTerminal()->traverse(this);
        if (node->getTest()) {
            node->getTest()->traverse(this);
            spv::Id condition =
                accessChainLoad(node->getTestExpr()->getType());
            builder.createConditionalBranch(condition, &blocks.head, &blocks.merge);
        } else {
            // TODO: unless there was a break/return/discard instruction
            // somewhere in the body, this is an infinite loop, so we should
            // issue a warning.
            builder.createBranch(true, &blocks.head);
        }
    }
    // Code following the loop is built in the merge block.
    builder.setBuildPoint(&blocks.merge);
    builder.closeLoop();
    return false;
}
&blocks.head);4984}4985}4986builder.setBuildPoint(&blocks.merge);4987builder.closeLoop();4988return false;4989}49904991bool TGlslangToSpvTraverser::visitBranch(glslang::TVisit /* visit */, glslang::TIntermBranch* node)4992{4993if (node->getExpression())4994node->getExpression()->traverse(this);49954996builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());49974998switch (node->getFlowOp()) {4999case glslang::EOpKill:5000if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6) {5001builder.addCapability(spv::Capability::DemoteToHelperInvocation);5002builder.createNoResultOp(spv::Op::OpDemoteToHelperInvocationEXT);5003} else {5004builder.makeStatementTerminator(spv::Op::OpKill, "post-discard");5005}5006break;5007case glslang::EOpTerminateInvocation:5008builder.addExtension(spv::E_SPV_KHR_terminate_invocation);5009builder.makeStatementTerminator(spv::Op::OpTerminateInvocation, "post-terminate-invocation");5010break;5011case glslang::EOpBreak:5012if (breakForLoop.top())5013builder.createLoopExit();5014else5015builder.addSwitchBreak(false);5016break;5017case glslang::EOpContinue:5018builder.createLoopContinue();5019break;5020case glslang::EOpReturn:5021if (node->getExpression() != nullptr) {5022const glslang::TType& glslangReturnType = node->getExpression()->getType();5023spv::Id returnId = accessChainLoad(glslangReturnType);5024if (builder.getTypeId(returnId) != currentFunction->getReturnType() ||5025TranslatePrecisionDecoration(glslangReturnType) != currentFunction->getReturnPrecision()) {5026builder.clearAccessChain();5027spv::Id copyId = builder.createVariable(currentFunction->getReturnPrecision(),5028spv::StorageClass::Function, currentFunction->getReturnType());5029builder.setAccessChainLValue(copyId);5030multiTypeStore(glslangReturnType, returnId);5031returnId = builder.createLoad(copyId, currentFunction->getReturnPrecision());5032}5033builder.makeReturn(false, returnId);5034} 
// Visit a variable declaration node. On the pre-visit pass only, set the
// debug source location to the declared symbol and look up its Id so that
// the debug info gets created. Always returns true, so the children of the
// node are visited by the traversal.
bool TGlslangToSpvTraverser::visitVariableDecl(glslang::TVisit visit, glslang::TIntermVariableDecl* node)
{
    if (visit == glslang::EvPreVisit) {
        builder.setDebugSourceLocation(node->getDeclSymbol()->getLoc().line, node->getDeclSymbol()->getLoc().getFilename());
        // We touch the symbol once here to create the debug info.
        getSymbolId(node->getDeclSymbol());
    }

    return true;
}


// Create the SPIR-V object backing a glslang symbol and return its Id.
//
// node:       the symbol to create a variable (or constant) for.
// forcedType: when not spv::NoType, used as the variable's SPIR-V type
//             instead of the type converted from the symbol.
//
// Constant-qualified symbols that createSpvConstant() can translate are
// returned as that constant's Id. Everything else becomes a variable in the
// storage class derived from the symbol's type, after the capabilities and
// extensions needed for 16-bit and 8-bit contents have been declared.
spv::Id TGlslangToSpvTraverser::createSpvVariable(const glslang::TIntermSymbol* node, spv::Id forcedType)
{
    // First, steer off constants, which are not SPIR-V variables, but
    // can still have a mapping to a SPIR-V Id.
    // This includes specialization constants.
    if (node->getQualifier().isConstant()) {
        spv::Id result = createSpvConstant(*node);
        if (result != spv::NoResult) {
            auto name = node->getAsSymbolNode()->getAccessName().c_str();
            auto typeId = convertGlslangToSpvType(node->getType());
            // the last argument tells the builder whether we are outside of any function
            builder.createConstVariable(typeId, name, result, currentFunction == nullptr);
            return result;
        }
    }

    // Now, handle actual variables
    spv::StorageClass storageClass = TranslateStorageClass(node->getType());
    spv::Id spvType = forcedType == spv::NoType ? convertGlslangToSpvType(node->getType())
                                                : forcedType;

    // 16-bit contents: which capability is needed depends on the storage class.
    const bool contains16BitType = node->getType().contains16BitFloat() ||
                                   node->getType().contains16BitInt();
    if (contains16BitType) {
        switch (storageClass) {
        case spv::StorageClass::Input:
        case spv::StorageClass::Output:
            builder.addIncorporatedExtension(spv::E_SPV_KHR_16bit_storage, spv::Spv_1_3);
            builder.addCapability(spv::Capability::StorageInputOutput16);
            break;
        case spv::StorageClass::Uniform:
            builder.addIncorporatedExtension(spv::E_SPV_KHR_16bit_storage, spv::Spv_1_3);
            // buffer-qualified blocks in the Uniform storage class use the buffer-block capability
            if (node->getType().getQualifier().storage == glslang::EvqBuffer)
                builder.addCapability(spv::Capability::StorageUniformBufferBlock16);
            else
                builder.addCapability(spv::Capability::StorageUniform16);
            break;
        case spv::StorageClass::PushConstant:
            builder.addIncorporatedExtension(spv::E_SPV_KHR_16bit_storage, spv::Spv_1_3);
            builder.addCapability(spv::Capability::StoragePushConstant16);
            break;
        case spv::StorageClass::StorageBuffer:
        case spv::StorageClass::PhysicalStorageBufferEXT:
            builder.addIncorporatedExtension(spv::E_SPV_KHR_16bit_storage, spv::Spv_1_3);
            builder.addCapability(spv::Capability::StorageUniformBufferBlock16);
            break;
        case spv::StorageClass::TileAttachmentQCOM:
            builder.addCapability(spv::Capability::TileShadingQCOM);
            break;
        default:
            // Workgroup blocks need only the explicit-layout capability ...
            if (storageClass == spv::StorageClass::Workgroup &&
                node->getType().getBasicType() == glslang::EbtBlock) {
                builder.addCapability(spv::Capability::WorkgroupMemoryExplicitLayout16BitAccessKHR);
                break;
            }
            // ... every other storage class needs the arithmetic capabilities.
            if (node->getType().contains16BitFloat())
                builder.addCapability(spv::Capability::Float16);
            if (node->getType().contains16BitInt())
                builder.addCapability(spv::Capability::Int16);
            break;
        }
    }

    // 8-bit integer contents: same idea, keyed on the storage class.
    if (node->getType().contains8BitInt()) {
        if (storageClass == spv::StorageClass::PushConstant) {
            builder.addIncorporatedExtension(spv::E_SPV_KHR_8bit_storage, spv::Spv_1_5);
            builder.addCapability(spv::Capability::StoragePushConstant8);
        } else if (storageClass == spv::StorageClass::Uniform) {
            builder.addIncorporatedExtension(spv::E_SPV_KHR_8bit_storage, spv::Spv_1_5);
            builder.addCapability(spv::Capability::UniformAndStorageBuffer8BitAccess);
        } else if (storageClass == spv::StorageClass::StorageBuffer) {
            builder.addIncorporatedExtension(spv::E_SPV_KHR_8bit_storage, spv::Spv_1_5);
            builder.addCapability(spv::Capability::StorageBuffer8BitAccess);
        } else if (storageClass == spv::StorageClass::Workgroup &&
                   node->getType().getBasicType() == glslang::EbtBlock) {
            builder.addCapability(spv::Capability::WorkgroupMemoryExplicitLayout8BitAccessKHR);
        } else {
            builder.addCapability(spv::Capability::Int8);
        }
    }

    // Anonymous symbols get an empty name in the SPIR-V module.
    const char* name = node->getName().c_str();
    if (glslang::IsAnonymous(name))
        name = "";

    spv::Id initializer = spv::NoResult;

    // Only two kinds of initializer are attached here: the constant array of a
    // uniform-qualified symbol, or a null constant for a null-initialized qualifier.
    if (node->getType().getQualifier().storage == glslang::EvqUniform && !node->getConstArray().empty()) {
        int nextConst = 0;
        initializer = createSpvConstantFromConstUnionArray(node->getType(),
                                                           node->getConstArray(),
                                                           nextConst,
                                                           false /* specConst */);
    } else if (node->getType().getQualifier().isNullInit()) {
        initializer = builder.makeNullConstant(spvType);
    }

    spv::Id var = builder.createVariable(spv::NoPrecision, storageClass, spvType, name, initializer, false);

    if (options.emitNonSemanticShaderDebugInfo && storageClass != spv::StorageClass::Function) {
        // Create variable alias for retargeted symbols if any.
        // Notably, this is only applicable to built-in variables so that it is okay to only use name as the key.
        auto [itBegin, itEnd] = glslangIntermediate->getBuiltinAliasLookup().equal_range(name);
        for (auto it = itBegin; it != itEnd; ++it) {
            builder.createDebugGlobalVariable(builder.getDebugType(spvType), it->second.c_str(), var);
        }
    }

    // Apply the memory decorations derived from the symbol's qualifier.
    std::vector<spv::Decoration> topLevelDecorations;
    glslang::TQualifier typeQualifier = node->getType().getQualifier();
    TranslateMemoryDecoration(typeQualifier, topLevelDecorations, glslangIntermediate->usingVulkanMemoryModel());
    for (auto deco : topLevelDecorations) {
        // On Apple builds the three Restrict* decorations are filtered out; the
        // `if` below guards the addDecoration() call that follows the #endif.
        // NOTE(review): the reason for the Apple-only filter is not visible here - confirm.
#ifdef __APPLE__
        if (deco != spv::Decoration::Restrict &&
            deco != spv::Decoration::RestrictPointer &&
            deco != spv::Decoration::RestrictPointerEXT)
#endif
        builder.addDecoration(var, deco);
    }
    return var;
}
topLevelDecorations;5180glslang::TQualifier typeQualifier = node->getType().getQualifier();5181TranslateMemoryDecoration(typeQualifier, topLevelDecorations, glslangIntermediate->usingVulkanMemoryModel());5182for (auto deco : topLevelDecorations) {5183#ifdef __APPLE__5184if (deco != spv::Decoration::Restrict &&5185deco != spv::Decoration::RestrictPointer &&5186deco != spv::Decoration::RestrictPointerEXT)5187#endif5188builder.addDecoration(var, deco);5189}5190return var;5191}51925193// Return type Id of the sampled type.5194spv::Id TGlslangToSpvTraverser::getSampledType(const glslang::TSampler& sampler)5195{5196switch (sampler.type) {5197case glslang::EbtInt: return builder.makeIntType(32);5198case glslang::EbtUint: return builder.makeUintType(32);5199case glslang::EbtFloat: return builder.makeFloatType(32);5200case glslang::EbtFloat16:5201builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float_fetch);5202builder.addCapability(spv::Capability::Float16ImageAMD);5203return builder.makeFloatType(16);5204case glslang::EbtInt64:5205builder.addExtension(spv::E_SPV_EXT_shader_image_int64);5206builder.addCapability(spv::Capability::Int64ImageEXT);5207return builder.makeIntType(64);5208case glslang::EbtUint64:5209builder.addExtension(spv::E_SPV_EXT_shader_image_int64);5210builder.addCapability(spv::Capability::Int64ImageEXT);5211return builder.makeUintType(64);5212default:5213assert(0);5214return builder.makeFloatType(32);5215}5216}52175218// If node is a swizzle operation, return the type that should be used if5219// the swizzle base is first consumed by another operation, before the swizzle5220// is applied.5221spv::Id TGlslangToSpvTraverser::getInvertedSwizzleType(const glslang::TIntermTyped& node)5222{5223if (node.getAsOperator() &&5224node.getAsOperator()->getOp() == glslang::EOpVectorSwizzle)5225return convertGlslangToSpvType(node.getAsBinaryNode()->getLeft()->getType());5226else5227return spv::NoType;5228}52295230// When inverting a swizzle with a parent op, this 
function5231// will apply the swizzle operation to a completed parent operation.5232spv::Id TGlslangToSpvTraverser::createInvertedSwizzle(spv::Decoration precision, const glslang::TIntermTyped& node,5233spv::Id parentResult)5234{5235std::vector<unsigned> swizzle;5236convertSwizzle(*node.getAsBinaryNode()->getRight()->getAsAggregate(), swizzle);5237return builder.createRvalueSwizzle(precision, convertGlslangToSpvType(node.getType()), parentResult, swizzle);5238}52395240// Convert a glslang AST swizzle node to a swizzle vector for building SPIR-V.5241void TGlslangToSpvTraverser::convertSwizzle(const glslang::TIntermAggregate& node, std::vector<unsigned>& swizzle)5242{5243const glslang::TIntermSequence& swizzleSequence = node.getSequence();5244for (int i = 0; i < (int)swizzleSequence.size(); ++i)5245swizzle.push_back(swizzleSequence[i]->getAsConstantUnion()->getConstArray()[0].getIConst());5246}52475248// Convert from a glslang type to an SPV type, by calling into a5249// recursive version of this function. 
This establishes the inherited5250// layout state rooted from the top-level type.5251spv::Id TGlslangToSpvTraverser::convertGlslangToSpvType(const glslang::TType& type, bool forwardReferenceOnly)5252{5253return convertGlslangToSpvType(type, getExplicitLayout(type), type.getQualifier(), false, forwardReferenceOnly);5254}52555256spv::LinkageType TGlslangToSpvTraverser::convertGlslangLinkageToSpv(glslang::TLinkType linkType)5257{5258switch (linkType) {5259case glslang::ELinkExport:5260return spv::LinkageType::Export;5261default:5262return spv::LinkageType::Max;5263}5264}52655266// Do full recursive conversion of an arbitrary glslang type to a SPIR-V Id.5267// explicitLayout can be kept the same throughout the hierarchical recursive walk.5268// Mutually recursive with convertGlslangStructToSpvType().5269spv::Id TGlslangToSpvTraverser::convertGlslangToSpvType(const glslang::TType& type,5270glslang::TLayoutPacking explicitLayout, const glslang::TQualifier& qualifier,5271bool lastBufferBlockMember, bool forwardReferenceOnly)5272{5273spv::Id spvType = spv::NoResult;52745275switch (type.getBasicType()) {5276case glslang::EbtVoid:5277spvType = builder.makeVoidType();5278assert (! type.isArray());5279break;5280case glslang::EbtBool:5281// "transparent" bool doesn't exist in SPIR-V. 
The GLSL convention is5282// a 32-bit int where non-0 means true.5283if (explicitLayout != glslang::ElpNone)5284spvType = builder.makeUintType(32);5285else5286spvType = builder.makeBoolType();5287break;5288case glslang::EbtInt:5289spvType = builder.makeIntType(32);5290break;5291case glslang::EbtUint:5292spvType = builder.makeUintType(32);5293break;5294case glslang::EbtFloat:5295spvType = builder.makeFloatType(32);5296break;5297case glslang::EbtDouble:5298spvType = builder.makeFloatType(64);5299break;5300case glslang::EbtFloat16:5301spvType = builder.makeFloatType(16);5302break;5303case glslang::EbtBFloat16:5304spvType = builder.makeBFloat16Type();5305break;5306case glslang::EbtFloatE5M2:5307spvType = builder.makeFloatE5M2Type();5308break;5309case glslang::EbtFloatE4M3:5310spvType = builder.makeFloatE4M3Type();5311break;5312case glslang::EbtInt8:5313spvType = builder.makeIntType(8);5314break;5315case glslang::EbtUint8:5316spvType = builder.makeUintType(8);5317break;5318case glslang::EbtInt16:5319spvType = builder.makeIntType(16);5320break;5321case glslang::EbtUint16:5322spvType = builder.makeUintType(16);5323break;5324case glslang::EbtInt64:5325spvType = builder.makeIntType(64);5326break;5327case glslang::EbtUint64:5328spvType = builder.makeUintType(64);5329break;5330case glslang::EbtAtomicUint:5331builder.addCapability(spv::Capability::AtomicStorage);5332spvType = builder.makeUintType(32);5333break;5334case glslang::EbtAccStruct:5335switch (glslangIntermediate->getStage()) {5336case EShLangRayGen:5337case EShLangIntersect:5338case EShLangAnyHit:5339case EShLangClosestHit:5340case EShLangMiss:5341case EShLangCallable:5342// these all should have the RayTracingNV/KHR capability already5343break;5344default:5345{5346auto& extensions = glslangIntermediate->getRequestedExtensions();5347if (extensions.find("GL_EXT_ray_query") != extensions.end()) 
{5348builder.addExtension(spv::E_SPV_KHR_ray_query);5349builder.addCapability(spv::Capability::RayQueryKHR);5350}5351}5352break;5353}5354spvType = builder.makeAccelerationStructureType();5355break;5356case glslang::EbtRayQuery:5357{5358auto& extensions = glslangIntermediate->getRequestedExtensions();5359if (extensions.find("GL_EXT_ray_query") != extensions.end()) {5360builder.addExtension(spv::E_SPV_KHR_ray_query);5361builder.addCapability(spv::Capability::RayQueryKHR);5362}5363spvType = builder.makeRayQueryType();5364}5365break;5366case glslang::EbtReference:5367{5368// Make the forward pointer, then recurse to convert the structure type, then5369// patch up the forward pointer with a real pointer type.5370if (forwardPointers.find(type.getReferentType()) == forwardPointers.end()) {5371spv::Id forwardId = builder.makeForwardPointer(spv::StorageClass::PhysicalStorageBufferEXT);5372forwardPointers[type.getReferentType()] = forwardId;5373}5374spvType = forwardPointers[type.getReferentType()];5375if (!forwardReferenceOnly) {5376spv::Id referentType = convertGlslangToSpvType(*type.getReferentType());5377builder.makePointerFromForwardPointer(spv::StorageClass::PhysicalStorageBufferEXT,5378forwardPointers[type.getReferentType()],5379referentType);5380}5381}5382break;5383case glslang::EbtSampler:5384{5385const glslang::TSampler& sampler = type.getSampler();5386std::string debugName;53875388if (sampler.isPureSampler()) {5389if (options.emitNonSemanticShaderDebugInfo) {5390if (glslangIntermediate->getSource() == glslang::EShSourceGlsl) {5391debugName = sampler.getString();5392}5393else {5394debugName = "type.sampler";5395}5396}5397spvType = builder.makeSamplerType(debugName.c_str());5398} else {5399// an image is present, make its type5400if (options.emitNonSemanticShaderDebugInfo) {5401if (glslangIntermediate->getSource() == glslang::EShSourceGlsl) {5402debugName = sampler.removeCombined().getString();5403}5404else {5405switch (sampler.dim) {5406case glslang::Esd1D: 
debugName = "type.1d.image"; break;5407case glslang::Esd2D: debugName = "type.2d.image"; break;5408case glslang::Esd3D: debugName = "type.3d.image"; break;5409case glslang::EsdCube: debugName = "type.cube.image"; break;5410default: debugName = "type.image"; break;5411}5412}5413}5414spvType = builder.makeImageType(getSampledType(sampler), TranslateDimensionality(sampler),5415sampler.isShadow(), sampler.isArrayed(), sampler.isMultiSample(),5416sampler.isImageClass() ? 2 : 1, TranslateImageFormat(type), debugName.c_str());5417if (sampler.isCombined() &&5418(!sampler.isBuffer() || glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_6)) {5419// Already has both image and sampler, make the combined type. Only combine sampler to5420// buffer if before SPIR-V 1.6.5421if (options.emitNonSemanticShaderDebugInfo) {5422if (glslangIntermediate->getSource() == glslang::EShSourceGlsl) {5423debugName = sampler.getString();5424}5425else {5426debugName = "type.sampled.image";5427}5428}5429spvType = builder.makeSampledImageType(spvType, debugName.c_str());5430}5431}5432}5433break;5434case glslang::EbtStruct:5435case glslang::EbtBlock:5436{5437// If we've seen this struct type, return it5438const glslang::TTypeList* glslangMembers = type.getStruct();54395440// Try to share structs for different layouts, but not yet for other5441// kinds of qualification (primarily not yet including interpolant qualification).5442if (! 
HasNonLayoutQualifiers(type, qualifier))5443spvType = structMap[explicitLayout][qualifier.layoutMatrix][glslangMembers];5444if (spvType != spv::NoResult)5445break;54465447// else, we haven't seen it...5448if (type.getBasicType() == glslang::EbtBlock)5449memberRemapper[glslangTypeToIdMap[glslangMembers]].resize(glslangMembers->size());5450spvType = convertGlslangStructToSpvType(type, glslangMembers, explicitLayout, qualifier);5451}5452break;5453case glslang::EbtString:5454// no type used for OpString5455return 0;54565457case glslang::EbtHitObjectNV: {5458builder.addExtension(spv::E_SPV_NV_shader_invocation_reorder);5459builder.addCapability(spv::Capability::ShaderInvocationReorderNV);5460spvType = builder.makeHitObjectNVType();5461}5462break;54635464case glslang::EbtHitObjectEXT: {5465builder.addExtension(spv::E_SPV_EXT_shader_invocation_reorder);5466builder.addCapability(spv::Capability::ShaderInvocationReorderEXT);5467spvType = builder.makeHitObjectEXTType();5468}5469break;5470case glslang::EbtSpirvType: {5471// GL_EXT_spirv_intrinsics5472const auto& spirvType = type.getSpirvType();5473const auto& spirvInst = spirvType.spirvInst;54745475std::vector<spv::IdImmediate> operands;5476for (const auto& typeParam : spirvType.typeParams) {5477if (typeParam.getAsConstant() != nullptr) {5478// Constant expression5479auto constant = typeParam.getAsConstant();5480if (constant->isLiteral()) {5481if (constant->getBasicType() == glslang::EbtFloat) {5482float floatValue = static_cast<float>(constant->getConstArray()[0].getDConst());5483unsigned literal;5484static_assert(sizeof(literal) == sizeof(floatValue), "sizeof(unsigned) != sizeof(float)");5485memcpy(&literal, &floatValue, sizeof(literal));5486operands.push_back({false, literal});5487} else if (constant->getBasicType() == glslang::EbtInt) {5488unsigned literal = constant->getConstArray()[0].getIConst();5489operands.push_back({false, literal});5490} else if (constant->getBasicType() == glslang::EbtUint) {5491unsigned literal = 
constant->getConstArray()[0].getUConst();5492operands.push_back({false, literal});5493} else if (constant->getBasicType() == glslang::EbtBool) {5494unsigned literal = constant->getConstArray()[0].getBConst();5495operands.push_back({false, literal});5496} else if (constant->getBasicType() == glslang::EbtString) {5497auto str = constant->getConstArray()[0].getSConst()->c_str();5498unsigned literal = 0;5499char* literalPtr = reinterpret_cast<char*>(&literal);5500unsigned charCount = 0;5501char ch = 0;5502do {5503ch = *(str++);5504*(literalPtr++) = ch;5505++charCount;5506if (charCount == 4) {5507operands.push_back({false, literal});5508literalPtr = reinterpret_cast<char*>(&literal);5509charCount = 0;5510}5511} while (ch != 0);55125513// Partial literal is padded with 05514if (charCount > 0) {5515for (; charCount < 4; ++charCount)5516*(literalPtr++) = 0;5517operands.push_back({false, literal});5518}5519} else5520assert(0); // Unexpected type5521} else5522operands.push_back({true, createSpvConstant(*constant)});5523} else {5524// Type specifier5525assert(typeParam.getAsType() != nullptr);5526operands.push_back({true, convertGlslangToSpvType(*typeParam.getAsType())});5527}5528}55295530assert(spirvInst.set == ""); // Currently, couldn't be extended instructions.5531spvType = builder.makeGenericType(static_cast<spv::Op>(spirvInst.id), operands);55325533break;5534}5535case glslang::EbtTensorLayoutNV:5536{5537builder.addCapability(spv::Capability::TensorAddressingNV);5538builder.addExtension(spv::E_SPV_NV_tensor_addressing);55395540std::vector<spv::IdImmediate> operands;5541for (uint32_t i = 0; i < 2; ++i) {5542operands.push_back({true, makeArraySizeId(*type.getTypeParameters()->arraySizes, i, true)});5543}5544spvType = builder.makeGenericType(spv::Op::OpTypeTensorLayoutNV, operands);5545break;5546}5547case glslang::EbtTensorViewNV:5548{5549builder.addCapability(spv::Capability::TensorAddressingNV);5550builder.addExtension(spv::E_SPV_NV_tensor_addressing);55515552uint32_t dim 
= type.getTypeParameters()->arraySizes->getDimSize(0);5553assert(dim >= 1 && dim <= 5);5554std::vector<spv::IdImmediate> operands;5555for (uint32_t i = 0; i < dim + 2; ++i) {5556operands.push_back({true, makeArraySizeId(*type.getTypeParameters()->arraySizes, i, true, i==1)});5557}5558spvType = builder.makeGenericType(spv::Op::OpTypeTensorViewNV, operands);5559break;5560}5561default:5562assert(0);5563break;5564}55655566if (type.isMatrix())5567spvType = builder.makeMatrixType(spvType, type.getMatrixCols(), type.getMatrixRows());5568else {5569// If this variable has a vector element count greater than 1, create a SPIR-V vector5570if (type.getVectorSize() > 1)5571spvType = builder.makeVectorType(spvType, type.getVectorSize());5572}55735574if (type.isCoopMatNV()) {5575builder.addCapability(spv::Capability::CooperativeMatrixNV);5576builder.addExtension(spv::E_SPV_NV_cooperative_matrix);55775578if (type.getBasicType() == glslang::EbtFloat16)5579builder.addCapability(spv::Capability::Float16);5580if (type.getBasicType() == glslang::EbtUint8 ||5581type.getBasicType() == glslang::EbtInt8) {5582builder.addCapability(spv::Capability::Int8);5583}55845585spv::Id scope = makeArraySizeId(*type.getTypeParameters()->arraySizes, 1);5586spv::Id rows = makeArraySizeId(*type.getTypeParameters()->arraySizes, 2);5587spv::Id cols = makeArraySizeId(*type.getTypeParameters()->arraySizes, 3);55885589spvType = builder.makeCooperativeMatrixTypeNV(spvType, scope, rows, cols);5590}55915592if (type.isCoopMatKHR()) {5593builder.addCapability(spv::Capability::CooperativeMatrixKHR);5594builder.addExtension(spv::E_SPV_KHR_cooperative_matrix);55955596if (type.getBasicType() == glslang::EbtBFloat16) {5597builder.addExtension(spv::E_SPV_KHR_bfloat16);5598builder.addCapability(spv::Capability::BFloat16CooperativeMatrixKHR);5599}56005601if (type.getBasicType() == glslang::EbtFloatE5M2 || type.getBasicType() == glslang::EbtFloatE4M3) 
{5602builder.addExtension(spv::E_SPV_EXT_float8);5603builder.addCapability(spv::Capability::Float8CooperativeMatrixEXT);5604}56055606if (type.getBasicType() == glslang::EbtFloat16)5607builder.addCapability(spv::Capability::Float16);5608if (type.getBasicType() == glslang::EbtUint8 || type.getBasicType() == glslang::EbtInt8) {5609builder.addCapability(spv::Capability::Int8);5610}56115612spv::Id scope = makeArraySizeId(*type.getTypeParameters()->arraySizes, 0);5613spv::Id rows = makeArraySizeId(*type.getTypeParameters()->arraySizes, 1);5614spv::Id cols = makeArraySizeId(*type.getTypeParameters()->arraySizes, 2);5615spv::Id use = makeArraySizeId(*type.getTypeParameters()->arraySizes, 3, true);56165617spvType = builder.makeCooperativeMatrixTypeKHR(spvType, scope, rows, cols, use);5618}5619else if (type.isTensorARM()) {5620builder.addCapability(spv::Capability::TensorsARM);5621builder.addExtension(spv::E_SPV_ARM_tensors);5622if (type.getBasicType() == glslang::EbtInt8 || type.getBasicType() == glslang::EbtUint8) {5623builder.addCapability(spv::Capability::Int8);5624} else if (type.getBasicType() == glslang::EbtInt16 ||5625type.getBasicType() == glslang::EbtUint16) {5626builder.addCapability(spv::Capability::Int16);5627} else if (type.getBasicType() == glslang::EbtInt64 ||5628type.getBasicType() == glslang::EbtUint64) {5629builder.addCapability(spv::Capability::Int64);5630} else if (type.getBasicType() == glslang::EbtFloat16) {5631builder.addCapability(spv::Capability::Float16);5632}56335634spv::Id rank = makeArraySizeId(*type.getTypeParameters()->arraySizes, 0);56355636spvType = builder.makeTensorTypeARM(spvType, rank);5637}56385639if (type.isCoopVecNV()) {5640builder.addCapability(spv::Capability::CooperativeVectorNV);5641builder.addExtension(spv::E_SPV_NV_cooperative_vector);56425643if (type.getBasicType() == glslang::EbtFloat16)5644builder.addCapability(spv::Capability::Float16);5645if (type.getBasicType() == glslang::EbtUint8 || type.getBasicType() == 
glslang::EbtInt8) {5646builder.addCapability(spv::Capability::Int8);5647}56485649spv::Id components = makeArraySizeId(*type.getTypeParameters()->arraySizes, 0);56505651spvType = builder.makeCooperativeVectorTypeNV(spvType, components);5652}56535654if (type.isArray()) {5655int stride = 0; // keep this 0 unless doing an explicit layout; 0 will mean no decoration, no stride56565657// Do all but the outer dimension5658if (type.getArraySizes()->getNumDims() > 1) {5659// We need to decorate array strides for types needing explicit layout, except blocks.5660if (explicitLayout != glslang::ElpNone && type.getBasicType() != glslang::EbtBlock) {5661// Use a dummy glslang type for querying internal strides of5662// arrays of arrays, but using just a one-dimensional array.5663glslang::TType simpleArrayType(type, 0); // deference type of the array5664while (simpleArrayType.getArraySizes()->getNumDims() > 1)5665simpleArrayType.getArraySizes()->dereference();56665667// Will compute the higher-order strides here, rather than making a whole5668// pile of types and doing repetitive recursion on their contents.5669stride = getArrayStride(simpleArrayType, explicitLayout, qualifier.layoutMatrix);5670}56715672// make the arrays5673for (int dim = type.getArraySizes()->getNumDims() - 1; dim > 0; --dim) {5674spvType = builder.makeArrayType(spvType, makeArraySizeId(*type.getArraySizes(), dim), stride);5675if (stride > 0)5676builder.addDecoration(spvType, spv::Decoration::ArrayStride, stride);5677stride *= type.getArraySizes()->getDimSize(dim);5678}5679} else {5680// single-dimensional array, and don't yet have stride56815682// We need to decorate array strides for types needing explicit layout, except blocks.5683if (explicitLayout != glslang::ElpNone && type.getBasicType() != glslang::EbtBlock)5684stride = getArrayStride(type, explicitLayout, qualifier.layoutMatrix);5685}56865687// Do the outer dimension, which might not be known for a runtime-sized array.5688// (Unsized arrays that survive 
through linking will be runtime-sized arrays)5689if (type.isSizedArray())5690spvType = builder.makeArrayType(spvType, makeArraySizeId(*type.getArraySizes(), 0), stride);5691else {5692// If we see an runtime array in a buffer_reference, it is not a descriptor5693if (!lastBufferBlockMember && type.getBasicType() != glslang::EbtReference) {5694builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);5695builder.addCapability(spv::Capability::RuntimeDescriptorArrayEXT);5696}5697spvType = builder.makeRuntimeArray(spvType);5698}5699if (stride > 0)5700builder.addDecoration(spvType, spv::Decoration::ArrayStride, stride);5701}57025703return spvType;5704}57055706// Apply SPIR-V decorations to the SPIR-V object (provided by SPIR-V ID). If member index is provided, the5707// decorations are applied to this member.5708void TGlslangToSpvTraverser::applySpirvDecorate(const glslang::TType& type, spv::Id id, std::optional<int> member)5709{5710assert(type.getQualifier().hasSpirvDecorate());57115712const glslang::TSpirvDecorate& spirvDecorate = type.getQualifier().getSpirvDecorate();57135714// Add spirv_decorate5715for (auto& decorate : spirvDecorate.decorates) {5716if (!decorate.second.empty()) {5717std::vector<unsigned> literals;5718TranslateLiterals(decorate.second, literals);5719if (member.has_value())5720builder.addMemberDecoration(id, *member, static_cast<spv::Decoration>(decorate.first), literals);5721else5722builder.addDecoration(id, static_cast<spv::Decoration>(decorate.first), literals);5723} else {5724if (member.has_value())5725builder.addMemberDecoration(id, *member, static_cast<spv::Decoration>(decorate.first));5726else5727builder.addDecoration(id, static_cast<spv::Decoration>(decorate.first));5728}5729}57305731// Add spirv_decorate_id5732if (member.has_value()) {5733// spirv_decorate_id not applied to members5734assert(spirvDecorate.decorateIds.empty());5735} else {5736for (auto& decorateId : spirvDecorate.decorateIds) {5737std::vector<spv::Id> 
operandIds;5738assert(!decorateId.second.empty());5739for (auto extraOperand : decorateId.second) {5740if (extraOperand->getQualifier().isFrontEndConstant())5741operandIds.push_back(createSpvConstant(*extraOperand));5742else5743operandIds.push_back(getSymbolId(extraOperand->getAsSymbolNode()));5744}5745builder.addDecorationId(id, static_cast<spv::Decoration>(decorateId.first), operandIds);5746}5747}57485749// Add spirv_decorate_string5750for (auto& decorateString : spirvDecorate.decorateStrings) {5751std::vector<const char*> strings;5752assert(!decorateString.second.empty());5753for (auto extraOperand : decorateString.second) {5754const char* string = extraOperand->getConstArray()[0].getSConst()->c_str();5755strings.push_back(string);5756}5757if (member.has_value())5758builder.addMemberDecoration(id, *member, static_cast<spv::Decoration>(decorateString.first), strings);5759else5760builder.addDecoration(id, static_cast<spv::Decoration>(decorateString.first), strings);5761}5762}57635764// TODO: this functionality should exist at a higher level, in creating the AST5765//5766// Identify interface members that don't have their required extension turned on.5767//5768bool TGlslangToSpvTraverser::filterMember(const glslang::TType& member)5769{5770auto& extensions = glslangIntermediate->getRequestedExtensions();57715772if (member.getFieldName() == "gl_SecondaryViewportMaskNV" &&5773extensions.find("GL_NV_stereo_view_rendering") == extensions.end())5774return true;5775if (member.getFieldName() == "gl_SecondaryPositionNV" &&5776extensions.find("GL_NV_stereo_view_rendering") == extensions.end())5777return true;57785779if (glslangIntermediate->getStage() == EShLangMesh) {5780if (member.getFieldName() == "gl_PrimitiveShadingRateEXT" &&5781extensions.find("GL_EXT_fragment_shading_rate") == extensions.end())5782return true;5783}57845785if (glslangIntermediate->getStage() != EShLangMesh) {5786if (member.getFieldName() == "gl_ViewportMask" 
&&5787extensions.find("GL_NV_viewport_array2") == extensions.end())5788return true;5789if (member.getFieldName() == "gl_PositionPerViewNV" &&5790extensions.find("GL_NVX_multiview_per_view_attributes") == extensions.end())5791return true;5792if (member.getFieldName() == "gl_ViewportMaskPerViewNV" &&5793extensions.find("GL_NVX_multiview_per_view_attributes") == extensions.end())5794return true;5795}57965797return false;5798}57995800// Do full recursive conversion of a glslang structure (or block) type to a SPIR-V Id.5801// explicitLayout can be kept the same throughout the hierarchical recursive walk.5802// Mutually recursive with convertGlslangToSpvType().5803spv::Id TGlslangToSpvTraverser::convertGlslangStructToSpvType(const glslang::TType& type,5804const glslang::TTypeList* glslangMembers,5805glslang::TLayoutPacking explicitLayout,5806const glslang::TQualifier& qualifier)5807{5808// Create a vector of struct types for SPIR-V to consume5809std::vector<spv::Id> spvMembers;5810int memberDelta = 0; // how much the member's index changes from glslang to SPIR-V, normally 0,5811// except sometimes for blocks5812std::vector<std::pair<glslang::TType*, glslang::TQualifier> > deferredForwardPointers;5813std::vector<spv::StructMemberDebugInfo> memberDebugInfo;5814for (int i = 0; i < (int)glslangMembers->size(); i++) {5815auto& glslangMember = (*glslangMembers)[i];5816if (glslangMember.type->hiddenMember()) {5817++memberDelta;5818if (type.getBasicType() == glslang::EbtBlock)5819memberRemapper[glslangTypeToIdMap[glslangMembers]][i] = -1;5820} else {5821if (type.getBasicType() == glslang::EbtBlock) {5822if (filterMember(*glslangMember.type)) {5823memberDelta++;5824memberRemapper[glslangTypeToIdMap[glslangMembers]][i] = -1;5825continue;5826}5827memberRemapper[glslangTypeToIdMap[glslangMembers]][i] = i - memberDelta;5828}5829// modify just this child's view of the qualifier5830glslang::TQualifier memberQualifier = 
glslangMember.type->getQualifier();5831InheritQualifiers(memberQualifier, qualifier);58325833// manually inherit location5834if (! memberQualifier.hasLocation() && qualifier.hasLocation())5835memberQualifier.layoutLocation = qualifier.layoutLocation;58365837// recurse5838bool lastBufferBlockMember = qualifier.storage == glslang::EvqBuffer &&5839i == (int)glslangMembers->size() - 1;58405841// Make forward pointers for any pointer members.5842if (glslangMember.type->isReference() &&5843forwardPointers.find(glslangMember.type->getReferentType()) == forwardPointers.end()) {5844deferredForwardPointers.push_back(std::make_pair(glslangMember.type, memberQualifier));5845}58465847// Create the member type.5848auto const spvMember = convertGlslangToSpvType(*glslangMember.type, explicitLayout, memberQualifier, lastBufferBlockMember,5849glslangMember.type->isReference());5850spvMembers.push_back(spvMember);58515852// Update the builder with the type's location so that we can create debug types for the structure members.5853// There doesn't exist a "clean" entry point for this information to be passed along to the builder so, for now,5854// it is stored in the builder and consumed during the construction of composite debug types.5855// TODO: This probably warrants further investigation. This approach was decided to be the least ugly of the5856// quick and dirty approaches that were tried.5857// Advantages of this approach:5858// + Relatively clean. No direct calls into debug type system.5859// + Handles nested recursive structures.5860// Disadvantages of this approach:5861// + Not as clean as desired. Traverser queries/sets persistent state. This is fragile.5862// + Table lookup during creation of composite debug types. 
This really shouldn't be necessary.5863if(options.emitNonSemanticShaderDebugInfo) {5864spv::StructMemberDebugInfo debugInfo{};5865debugInfo.name = glslangMember.type->getFieldName();5866debugInfo.line = glslangMember.loc.line;5867debugInfo.column = glslangMember.loc.column;58685869// Per the GLSL spec, bool variables inside of a uniform or buffer block are generated as uint.5870// But for debug info, we want to represent them as bool because that is the original type in5871// the source code. The bool type can be nested within a vector or a multidimensional array,5872// so we must construct the chain of types up from the scalar bool.5873if (glslangIntermediate->getSource() == glslang::EShSourceGlsl && explicitLayout != glslang::ElpNone &&5874glslangMember.type->getBasicType() == glslang::EbtBool) {5875auto typeId = builder.makeBoolType();5876if (glslangMember.type->isVector()) {5877typeId = builder.makeVectorType(typeId, glslangMember.type->getVectorSize());5878}5879if (glslangMember.type->isArray()) {5880const auto* arraySizes = glslangMember.type->getArraySizes();5881int dims = arraySizes->getNumDims();5882for (int i = dims - 1; i >= 0; --i) {5883spv::Id size = builder.makeIntConstant(arraySizes->getDimSize(i));5884typeId = builder.makeArrayType(typeId, size, 0);5885}5886}5887debugInfo.debugTypeOverride = builder.getDebugType(typeId);5888}58895890memberDebugInfo.push_back(debugInfo);5891}5892}5893}58945895// Make the SPIR-V type5896spv::Id spvType = builder.makeStructType(spvMembers, memberDebugInfo, type.getTypeName().c_str(), false);5897if (! 
HasNonLayoutQualifiers(type, qualifier))5898structMap[explicitLayout][qualifier.layoutMatrix][glslangMembers] = spvType;58995900// Decorate it5901decorateStructType(type, glslangMembers, explicitLayout, qualifier, spvType, spvMembers);59025903for (int i = 0; i < (int)deferredForwardPointers.size(); ++i) {5904auto it = deferredForwardPointers[i];5905convertGlslangToSpvType(*it.first, explicitLayout, it.second, false);5906}59075908return spvType;5909}59105911void TGlslangToSpvTraverser::decorateStructType(const glslang::TType& type,5912const glslang::TTypeList* glslangMembers,5913glslang::TLayoutPacking explicitLayout,5914const glslang::TQualifier& qualifier,5915spv::Id spvType,5916const std::vector<spv::Id>& spvMembers)5917{5918// Name and decorate the non-hidden members5919int offset = -1;5920bool memberLocationInvalid = type.isArrayOfArrays() ||5921(type.isArray() && (type.getQualifier().isArrayedIo(glslangIntermediate->getStage()) == false));5922for (int i = 0; i < (int)glslangMembers->size(); i++) {5923glslang::TType& glslangMember = *(*glslangMembers)[i].type;5924int member = i;5925if (type.getBasicType() == glslang::EbtBlock) {5926member = memberRemapper[glslangTypeToIdMap[glslangMembers]][i];5927if (filterMember(glslangMember))5928continue;5929}59305931// modify just this child's view of the qualifier5932glslang::TQualifier memberQualifier = glslangMember.getQualifier();5933InheritQualifiers(memberQualifier, qualifier);59345935// using -1 above to indicate a hidden member5936if (member < 0)5937continue;59385939builder.addMemberName(spvType, member, glslangMember.getFieldName().c_str());5940builder.addMemberDecoration(spvType, member,5941TranslateLayoutDecoration(glslangMember, memberQualifier.layoutMatrix));5942builder.addMemberDecoration(spvType, member, TranslatePrecisionDecoration(glslangMember));5943// Add interpolation and auxiliary storage decorations only to5944// top-level members of Input and Output storage classes5945if (type.getQualifier().storage 
== glslang::EvqVaryingIn ||5946type.getQualifier().storage == glslang::EvqVaryingOut) {5947if (type.getBasicType() == glslang::EbtBlock ||5948glslangIntermediate->getSource() == glslang::EShSourceHlsl) {5949builder.addMemberDecoration(spvType, member, TranslateInterpolationDecoration(memberQualifier));5950builder.addMemberDecoration(spvType, member, TranslateAuxiliaryStorageDecoration(memberQualifier));5951addMeshNVDecoration(spvType, member, memberQualifier);5952}5953}5954builder.addMemberDecoration(spvType, member, TranslateInvariantDecoration(memberQualifier));59555956if (type.getBasicType() == glslang::EbtBlock &&5957qualifier.storage == glslang::EvqBuffer) {5958// Add memory decorations only to top-level members of shader storage block5959std::vector<spv::Decoration> memory;5960TranslateMemoryDecoration(memberQualifier, memory, glslangIntermediate->usingVulkanMemoryModel());5961for (unsigned int i = 0; i < memory.size(); ++i)5962builder.addMemberDecoration(spvType, member, memory[i]);5963}59645965// Location assignment was already completed correctly by the front end,5966// just track whether a member needs to be decorated.5967// Ignore member locations if the container is an array, as that's5968// ill-specified and decisions have been made to not allow this.5969if (!memberLocationInvalid && memberQualifier.hasLocation())5970builder.addMemberDecoration(spvType, member, spv::Decoration::Location, memberQualifier.layoutLocation);59715972// component, XFB, others5973if (glslangMember.getQualifier().hasComponent())5974builder.addMemberDecoration(spvType, member, spv::Decoration::Component,5975glslangMember.getQualifier().layoutComponent);5976if (glslangMember.getQualifier().hasXfbOffset())5977builder.addMemberDecoration(spvType, member, spv::Decoration::Offset,5978glslangMember.getQualifier().layoutXfbOffset);5979else if (explicitLayout != glslang::ElpNone) {5980// figure out what to do with offset, which is accumulating5981int 
nextOffset;5982updateMemberOffset(type, glslangMember, offset, nextOffset, explicitLayout, memberQualifier.layoutMatrix);5983if (offset >= 0)5984builder.addMemberDecoration(spvType, member, spv::Decoration::Offset, offset);5985offset = nextOffset;5986}59875988if (glslangMember.isMatrix() && explicitLayout != glslang::ElpNone)5989builder.addMemberDecoration(spvType, member, spv::Decoration::MatrixStride,5990getMatrixStride(glslangMember, explicitLayout, memberQualifier.layoutMatrix));59915992// built-in variable decorations5993spv::BuiltIn builtIn = TranslateBuiltInDecoration(glslangMember.getQualifier().builtIn, true);5994if (builtIn != spv::BuiltIn::Max)5995builder.addMemberDecoration(spvType, member, spv::Decoration::BuiltIn, (int)builtIn);59965997// nonuniform5998builder.addMemberDecoration(spvType, member, TranslateNonUniformDecoration(glslangMember.getQualifier()));59996000if (glslangIntermediate->getHlslFunctionality1() && memberQualifier.semanticName != nullptr) {6001builder.addExtension("SPV_GOOGLE_hlsl_functionality1");6002builder.addMemberDecoration(spvType, member, spv::Decoration::HlslSemanticGOOGLE,6003memberQualifier.semanticName);6004}60056006if (builtIn == spv::BuiltIn::Layer) {6007// SPV_NV_viewport_array2 extension6008if (glslangMember.getQualifier().layoutViewportRelative){6009builder.addMemberDecoration(spvType, member, spv::Decoration::ViewportRelativeNV);6010builder.addCapability(spv::Capability::ShaderViewportMaskNV);6011builder.addExtension(spv::E_SPV_NV_viewport_array2);6012}6013if (glslangMember.getQualifier().layoutSecondaryViewportRelativeOffset != -2048){6014builder.addMemberDecoration(spvType, member,6015spv::Decoration::SecondaryViewportRelativeNV,6016glslangMember.getQualifier().layoutSecondaryViewportRelativeOffset);6017builder.addCapability(spv::Capability::ShaderStereoViewNV);6018builder.addExtension(spv::E_SPV_NV_stereo_view_rendering);6019}6020}6021if (glslangMember.getQualifier().layoutPassthrough) 
{6022builder.addMemberDecoration(spvType, member, spv::Decoration::PassthroughNV);6023builder.addCapability(spv::Capability::GeometryShaderPassthroughNV);6024builder.addExtension(spv::E_SPV_NV_geometry_shader_passthrough);6025}60266027// Add SPIR-V decorations (GL_EXT_spirv_intrinsics)6028if (glslangMember.getQualifier().hasSpirvDecorate())6029applySpirvDecorate(glslangMember, spvType, member);6030}60316032// Decorate the structure6033builder.addDecoration(spvType, TranslateLayoutDecoration(type, qualifier.layoutMatrix));6034const auto basicType = type.getBasicType();6035const auto typeStorageQualifier = type.getQualifier().storage;6036if (basicType == glslang::EbtBlock) {6037builder.addDecoration(spvType, TranslateBlockDecoration(typeStorageQualifier, glslangIntermediate->usingStorageBuffer()));6038} else if (basicType == glslang::EbtStruct && glslangIntermediate->getSpv().vulkan > 0) {6039const auto hasRuntimeArray = !spvMembers.empty() && builder.getOpCode(spvMembers.back()) == spv::Op::OpTypeRuntimeArray;6040if (hasRuntimeArray) {6041builder.addDecoration(spvType, TranslateBlockDecoration(typeStorageQualifier, glslangIntermediate->usingStorageBuffer()));6042}6043}60446045if (qualifier.hasHitObjectShaderRecordNV())6046builder.addDecoration(spvType, spv::Decoration::HitObjectShaderRecordBufferNV);6047if (qualifier.hasHitObjectShaderRecordEXT())6048builder.addDecoration(spvType, spv::Decoration::HitObjectShaderRecordBufferEXT);6049}60506051// Turn the expression forming the array size into an id.6052// This is not quite trivial, because of specialization constants.6053// Sometimes, a raw constant is turned into an Id, and sometimes6054// a specialization constant expression is.6055spv::Id TGlslangToSpvTraverser::makeArraySizeId(const glslang::TArraySizes& arraySizes, int dim, bool allowZero, bool boolType)6056{6057// First, see if this is sized with a node, meaning a specialization constant:6058glslang::TIntermTyped* specNode = arraySizes.getDimNode(dim);6059if 
(specNode != nullptr) {6060builder.clearAccessChain();6061SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);6062spec_constant_op_mode_setter.turnOnSpecConstantOpMode();6063specNode->traverse(this);6064return accessChainLoad(specNode->getAsTyped()->getType());6065}60666067// Otherwise, need a compile-time (front end) size, get it:6068int size = arraySizes.getDimSize(dim);60696070if (!allowZero)6071assert(size > 0);60726073if (boolType) {6074return builder.makeBoolConstant(size);6075} else {6076return builder.makeUintConstant(size);6077}6078}60796080// Wrap the builder's accessChainLoad to:6081// - localize handling of RelaxedPrecision6082// - use the SPIR-V inferred type instead of another conversion of the glslang type6083// (avoids unnecessary work and possible type punning for structures)6084// - do conversion of concrete to abstract type6085spv::Id TGlslangToSpvTraverser::accessChainLoad(const glslang::TType& type)6086{6087spv::Id nominalTypeId = builder.accessChainGetInferredType();60886089spv::Builder::AccessChain::CoherentFlags coherentFlags = builder.getAccessChain().coherentFlags;6090coherentFlags |= TranslateCoherent(type);60916092spv::MemoryAccessMask accessMask = spv::MemoryAccessMask(TranslateMemoryAccess(coherentFlags) & ~spv::MemoryAccessMask::MakePointerAvailableKHR);6093// If the value being loaded is HelperInvocation, SPIR-V 1.6 is being generated (so that6094// SPV_EXT_demote_to_helper_invocation is in core) and the memory model is in use, add6095// the Volatile MemoryAccess semantic.6096if (type.getQualifier().builtIn == glslang::EbvHelperInvocation &&6097glslangIntermediate->usingVulkanMemoryModel() &&6098glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6) {6099accessMask = spv::MemoryAccessMask(accessMask | spv::MemoryAccessMask::Volatile);6100}61016102unsigned int alignment = builder.getAccessChain().alignment;6103alignment |= type.getBufferReferenceAlignment();61046105spv::Id loadedId = 
builder.accessChainLoad(TranslatePrecisionDecoration(type),6106TranslateNonUniformDecoration(builder.getAccessChain().coherentFlags),6107TranslateNonUniformDecoration(type.getQualifier()),6108nominalTypeId,6109accessMask,6110TranslateMemoryScope(coherentFlags),6111alignment);61126113// Need to convert to abstract types when necessary6114if (type.getBasicType() == glslang::EbtBool) {6115loadedId = convertLoadedBoolInUniformToUint(type, nominalTypeId, loadedId);6116}61176118return loadedId;6119}61206121// Wrap the builder's accessChainStore to:6122// - do conversion of concrete to abstract type6123//6124// Implicitly uses the existing builder.accessChain as the storage target.6125void TGlslangToSpvTraverser::accessChainStore(const glslang::TType& type, spv::Id rvalue)6126{6127// Need to convert to abstract types when necessary6128if (type.getBasicType() == glslang::EbtBool) {6129spv::Id nominalTypeId = builder.accessChainGetInferredType();61306131if (builder.isScalarType(nominalTypeId)) {6132// Conversion for bool6133spv::Id boolType = builder.makeBoolType();6134if (nominalTypeId != boolType) {6135// keep these outside arguments, for determinant order-of-evaluation6136spv::Id one = builder.makeUintConstant(1);6137spv::Id zero = builder.makeUintConstant(0);6138rvalue = builder.createTriOp(spv::Op::OpSelect, nominalTypeId, rvalue, one, zero);6139} else if (builder.getTypeId(rvalue) != boolType)6140rvalue = builder.createBinOp(spv::Op::OpINotEqual, boolType, rvalue, builder.makeUintConstant(0));6141} else if (builder.isVectorType(nominalTypeId)) {6142// Conversion for bvec6143int vecSize = builder.getNumTypeComponents(nominalTypeId);6144spv::Id bvecType = builder.makeVectorType(builder.makeBoolType(), vecSize);6145if (nominalTypeId != bvecType) {6146// keep these outside arguments, for determinant order-of-evaluation6147spv::Id one = makeSmearedConstant(builder.makeUintConstant(1), vecSize);6148spv::Id zero = makeSmearedConstant(builder.makeUintConstant(0), 
vecSize);6149rvalue = builder.createTriOp(spv::Op::OpSelect, nominalTypeId, rvalue, one, zero);6150} else if (builder.getTypeId(rvalue) != bvecType)6151rvalue = builder.createBinOp(spv::Op::OpINotEqual, bvecType, rvalue,6152makeSmearedConstant(builder.makeUintConstant(0), vecSize));6153}6154}61556156spv::Builder::AccessChain::CoherentFlags coherentFlags = builder.getAccessChain().coherentFlags;6157coherentFlags |= TranslateCoherent(type);61586159unsigned int alignment = builder.getAccessChain().alignment;6160alignment |= type.getBufferReferenceAlignment();61616162builder.accessChainStore(rvalue, TranslateNonUniformDecoration(builder.getAccessChain().coherentFlags),6163spv::MemoryAccessMask(TranslateMemoryAccess(coherentFlags) &6164~spv::MemoryAccessMask::MakePointerVisibleKHR),6165TranslateMemoryScope(coherentFlags), alignment);6166}61676168// For storing when types match at the glslang level, but not might match at the6169// SPIR-V level.6170//6171// This especially happens when a single glslang type expands to multiple6172// SPIR-V types, like a struct that is used in a member-undecorated way as well6173// as in a member-decorated way.6174//6175// NOTE: This function can handle any store request; if it's not special it6176// simplifies to a simple OpStore.6177//6178// Implicitly uses the existing builder.accessChain as the storage target.6179void TGlslangToSpvTraverser::multiTypeStore(const glslang::TType& type, spv::Id rValue)6180{6181// we only do the complex path here if it's an aggregate6182if (! type.isStruct() && ! 
type.isArray()) {6183accessChainStore(type, rValue);6184return;6185}61866187// and, it has to be a case of type aliasing6188spv::Id rType = builder.getTypeId(rValue);6189spv::Id lValue = builder.accessChainGetLValue();6190spv::Id lType = builder.getContainedTypeId(builder.getTypeId(lValue));6191if (lType == rType) {6192accessChainStore(type, rValue);6193return;6194}61956196// Recursively (as needed) copy an aggregate type to a different aggregate type,6197// where the two types were the same type in GLSL. This requires member6198// by member copy, recursively.61996200// SPIR-V 1.4 added an instruction to do help do this.6201if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4) {6202// However, bool in uniform space is changed to int, so6203// OpCopyLogical does not work for that.6204// TODO: It would be more robust to do a full recursive verification of the types satisfying SPIR-V rules.6205bool rBool = builder.containsType(builder.getTypeId(rValue), spv::Op::OpTypeBool, 0);6206bool lBool = builder.containsType(lType, spv::Op::OpTypeBool, 0);6207if (lBool == rBool) {6208spv::Id logicalCopy = builder.createUnaryOp(spv::Op::OpCopyLogical, lType, rValue);6209accessChainStore(type, logicalCopy);6210return;6211}6212}62136214// If an array, copy element by element.6215if (type.isArray()) {6216glslang::TType glslangElementType(type, 0);6217spv::Id elementRType = builder.getContainedTypeId(rType);6218for (int index = 0; index < type.getOuterArraySize(); ++index) {6219// get the source member6220spv::Id elementRValue = builder.createCompositeExtract(rValue, elementRType, index);62216222// set up the target storage6223builder.clearAccessChain();6224builder.setAccessChainLValue(lValue);6225builder.accessChainPush(builder.makeIntConstant(index), TranslateCoherent(type),6226type.getBufferReferenceAlignment());62276228// store the member6229multiTypeStore(glslangElementType, elementRValue);6230}6231} else {6232assert(type.isStruct());62336234// loop over structure 
members6235const glslang::TTypeList& members = *type.getStruct();6236for (int m = 0; m < (int)members.size(); ++m) {6237const glslang::TType& glslangMemberType = *members[m].type;62386239// get the source member6240spv::Id memberRType = builder.getContainedTypeId(rType, m);6241spv::Id memberRValue = builder.createCompositeExtract(rValue, memberRType, m);62426243// set up the target storage6244builder.clearAccessChain();6245builder.setAccessChainLValue(lValue);6246builder.accessChainPush(builder.makeIntConstant(m), TranslateCoherent(type),6247type.getBufferReferenceAlignment());62486249// store the member6250multiTypeStore(glslangMemberType, memberRValue);6251}6252}6253}62546255// Decide whether or not this type should be6256// decorated with offsets and strides, and if so6257// whether std140 or std430 rules should be applied.6258glslang::TLayoutPacking TGlslangToSpvTraverser::getExplicitLayout(const glslang::TType& type) const6259{6260// has to be a block6261if (type.getBasicType() != glslang::EbtBlock)6262return glslang::ElpNone;62636264// has to be a uniform or buffer block or task in/out blocks6265if (type.getQualifier().storage != glslang::EvqUniform &&6266type.getQualifier().storage != glslang::EvqBuffer &&6267type.getQualifier().storage != glslang::EvqShared &&6268!type.getQualifier().isTaskMemory())6269return glslang::ElpNone;62706271// return the layout to use6272switch (type.getQualifier().layoutPacking) {6273case glslang::ElpStd140:6274case glslang::ElpStd430:6275case glslang::ElpScalar:6276return type.getQualifier().layoutPacking;6277default:6278return glslang::ElpNone;6279}6280}62816282// Given an array type, returns the integer stride required for that array6283int TGlslangToSpvTraverser::getArrayStride(const glslang::TType& arrayType, glslang::TLayoutPacking explicitLayout,6284glslang::TLayoutMatrix matrixLayout)6285{6286int size;6287int stride;6288glslangIntermediate->getMemberAlignment(arrayType, size, stride, explicitLayout,6289matrixLayout == 
glslang::ElmRowMajor);62906291return stride;6292}62936294// Given a matrix type, or array (of array) of matrixes type, returns the integer stride required for that matrix6295// when used as a member of an interface block6296int TGlslangToSpvTraverser::getMatrixStride(const glslang::TType& matrixType, glslang::TLayoutPacking explicitLayout,6297glslang::TLayoutMatrix matrixLayout)6298{6299glslang::TType elementType;6300elementType.shallowCopy(matrixType);6301elementType.clearArraySizes();63026303int size;6304int stride;6305glslangIntermediate->getMemberAlignment(elementType, size, stride, explicitLayout,6306matrixLayout == glslang::ElmRowMajor);63076308return stride;6309}63106311// Given a member type of a struct, realign the current offset for it, and compute6312// the next (not yet aligned) offset for the next member, which will get aligned6313// on the next call.6314// 'currentOffset' should be passed in already initialized, ready to modify, and reflecting6315// the migration of data from nextOffset -> currentOffset. It should be -1 on the first call.6316// -1 means a non-forced member offset (no decoration needed).6317void TGlslangToSpvTraverser::updateMemberOffset(const glslang::TType& structType, const glslang::TType& memberType,6318int& currentOffset, int& nextOffset, glslang::TLayoutPacking explicitLayout, glslang::TLayoutMatrix matrixLayout)6319{6320// this will get a positive value when deemed necessary6321nextOffset = -1;63226323// override anything in currentOffset with user-set offset6324if (memberType.getQualifier().hasOffset())6325currentOffset = memberType.getQualifier().layoutOffset;63266327// It could be that current linker usage in glslang updated all the layoutOffset,6328// in which case the following code does not matter. 
But, that's not quite right6329// once cross-compilation unit GLSL validation is done, as the original user6330// settings are needed in layoutOffset, and then the following will come into play.63316332if (explicitLayout == glslang::ElpNone) {6333if (! memberType.getQualifier().hasOffset())6334currentOffset = -1;63356336return;6337}63386339// Getting this far means we need explicit offsets6340if (currentOffset < 0)6341currentOffset = 0;63426343// Now, currentOffset is valid (either 0, or from a previous nextOffset),6344// but possibly not yet correctly aligned.63456346int memberSize;6347int dummyStride;6348int memberAlignment = glslangIntermediate->getMemberAlignment(memberType, memberSize, dummyStride, explicitLayout,6349matrixLayout == glslang::ElmRowMajor);63506351bool isVectorLike = memberType.isVector();6352if (memberType.isMatrix()) {6353if (matrixLayout == glslang::ElmRowMajor)6354isVectorLike = memberType.getMatrixRows() == 1;6355else6356isVectorLike = memberType.getMatrixCols() == 1;6357}63586359// Adjust alignment for HLSL rules6360// TODO: make this consistent in early phases of code:6361// adjusting this late means inconsistencies with earlier code, which for reflection is an issue6362// Until reflection is brought in sync with these adjustments, don't apply to $Global,6363// which is the most likely to rely on reflection, and least likely to rely implicit layouts6364if (glslangIntermediate->usingHlslOffsets() &&6365! memberType.isStruct() && structType.getTypeName().compare("$Global") != 0) {6366int componentSize;6367int componentAlignment = glslangIntermediate->getBaseAlignmentScalar(memberType, componentSize);6368if (! 
memberType.isArray() && isVectorLike && componentAlignment <= 4)6369memberAlignment = componentAlignment;63706371// Don't add unnecessary padding after this member6372// (undo std140 bumping size to a mutliple of vec4)6373if (explicitLayout == glslang::ElpStd140) {6374if (memberType.isMatrix()) {6375if (matrixLayout == glslang::ElmRowMajor)6376memberSize -= componentSize * (4 - memberType.getMatrixCols());6377else6378memberSize -= componentSize * (4 - memberType.getMatrixRows());6379} else if (memberType.isArray())6380memberSize -= componentSize * (4 - memberType.getVectorSize());6381}6382}63836384// Bump up to member alignment6385glslang::RoundToPow2(currentOffset, memberAlignment);63866387// Bump up to vec4 if there is a bad straddle6388if (explicitLayout != glslang::ElpScalar && glslangIntermediate->improperStraddle(memberType, memberSize,6389currentOffset, isVectorLike))6390glslang::RoundToPow2(currentOffset, 16);63916392nextOffset = currentOffset + memberSize;6393}63946395void TGlslangToSpvTraverser::declareUseOfStructMember(const glslang::TTypeList& members, int glslangMember)6396{6397const glslang::TBuiltInVariable glslangBuiltIn = members[glslangMember].type->getQualifier().builtIn;6398switch (glslangBuiltIn)6399{6400case glslang::EbvPointSize:6401case glslang::EbvClipDistance:6402case glslang::EbvCullDistance:6403case glslang::EbvViewportMaskNV:6404case glslang::EbvSecondaryPositionNV:6405case glslang::EbvSecondaryViewportMaskNV:6406case glslang::EbvPositionPerViewNV:6407case glslang::EbvViewportMaskPerViewNV:6408case glslang::EbvTaskCountNV:6409case glslang::EbvPrimitiveCountNV:6410case glslang::EbvPrimitiveIndicesNV:6411case glslang::EbvClipDistancePerViewNV:6412case glslang::EbvCullDistancePerViewNV:6413case glslang::EbvLayerPerViewNV:6414case glslang::EbvMeshViewCountNV:6415case glslang::EbvMeshViewIndicesNV:6416// Generate the associated capability. 
Delegate to TranslateBuiltInDecoration.6417// Alternately, we could just call this for any glslang built-in, since the6418// capability already guards against duplicates.6419TranslateBuiltInDecoration(glslangBuiltIn, false);6420break;6421default:6422// Capabilities were already generated when the struct was declared.6423break;6424}6425}64266427bool TGlslangToSpvTraverser::isShaderEntryPoint(const glslang::TIntermAggregate* node)6428{6429return node->getName().compare(glslangIntermediate->getEntryPointMangledName().c_str()) == 0;6430}64316432// Does parameter need a place to keep writes, separate from the original?6433// Assumes called after originalParam(), which filters out block/buffer/opaque-based6434// qualifiers such that we should have only in/out/inout/constreadonly here.6435bool TGlslangToSpvTraverser::writableParam(glslang::TStorageQualifier qualifier) const6436{6437assert(qualifier == glslang::EvqIn ||6438qualifier == glslang::EvqOut ||6439qualifier == glslang::EvqInOut ||6440qualifier == glslang::EvqUniform ||6441qualifier == glslang::EvqConstReadOnly);6442return qualifier != glslang::EvqConstReadOnly &&6443qualifier != glslang::EvqUniform;6444}64456446// Is parameter pass-by-original?6447bool TGlslangToSpvTraverser::originalParam(glslang::TStorageQualifier qualifier, const glslang::TType& paramType,6448bool implicitThisParam)6449{6450if (implicitThisParam) // implicit this6451return true;6452if (glslangIntermediate->getSource() == glslang::EShSourceHlsl)6453return paramType.getBasicType() == glslang::EbtBlock;6454return (paramType.containsOpaque() && !glslangIntermediate->getBindlessMode()) || // sampler, etc.6455paramType.getQualifier().isSpirvByReference() || // spirv_by_reference6456(paramType.getBasicType() == glslang::EbtBlock && qualifier == glslang::EvqBuffer); // SSBO6457}64586459// Make all the functions, skeletally, without actually visiting their bodies.6460void TGlslangToSpvTraverser::makeFunctions(const glslang::TIntermSequence& 
glslFunctions)6461{6462const auto getParamDecorations = [&](std::vector<spv::Decoration>& decorations, const glslang::TType& type,6463bool useVulkanMemoryModel) {6464spv::Decoration paramPrecision = TranslatePrecisionDecoration(type);6465if (paramPrecision != spv::NoPrecision)6466decorations.push_back(paramPrecision);6467TranslateMemoryDecoration(type.getQualifier(), decorations, useVulkanMemoryModel);6468if (type.isReference()) {6469// Original and non-writable params pass the pointer directly and6470// use restrict/aliased, others are stored to a pointer in Function6471// memory and use RestrictPointer/AliasedPointer.6472if (originalParam(type.getQualifier().storage, type, false) ||6473!writableParam(type.getQualifier().storage)) {6474// TranslateMemoryDecoration added Restrict decoration already.6475if (!type.getQualifier().isRestrict()) {6476decorations.push_back(spv::Decoration::Aliased);6477}6478} else {6479decorations.push_back(type.getQualifier().isRestrict() ? spv::Decoration::RestrictPointerEXT :6480spv::Decoration::AliasedPointerEXT);6481}6482}6483};64846485for (int f = 0; f < (int)glslFunctions.size(); ++f) {6486glslang::TIntermAggregate* glslFunction = glslFunctions[f]->getAsAggregate();6487if (! glslFunction || glslFunction->getOp() != glslang::EOpFunction)6488continue;64896490builder.setDebugSourceLocation(glslFunction->getLoc().line, glslFunction->getLoc().getFilename());64916492if (isShaderEntryPoint(glslFunction)) {6493// For HLSL, the entry function is actually a compiler generated function to resolve the difference of6494// entry function signature between HLSL and SPIR-V. So we don't emit debug information for that.6495if (glslangIntermediate->getSource() != glslang::EShSourceHlsl) {6496builder.setupFunctionDebugInfo(shaderEntry, glslangIntermediate->getEntryPointMangledName().c_str(),6497std::vector<spv::Id>(), // main function has no param6498std::vector<char const*>());6499}6500continue;6501}6502// We're on a user function. 
Set up the basic interface for the function now,6503// so that it's available to call. Translating the body will happen later.6504//6505// Typically (except for a "const in" parameter), an address will be passed to the6506// function. What it is an address of varies:6507//6508// - "in" parameters not marked as "const" can be written to without modifying the calling6509// argument so that write needs to be to a copy, hence the address of a copy works.6510//6511// - "const in" parameters can just be the r-value, as no writes need occur.6512//6513// - "out" and "inout" arguments can't be done as pointers to the calling argument, because6514// GLSL has copy-in/copy-out semantics. They can be handled though with a pointer to a copy.65156516std::vector<spv::Id> paramTypes;6517std::vector<char const*> paramNames;6518std::vector<std::vector<spv::Decoration>> paramDecorations; // list of decorations per parameter6519glslang::TIntermSequence& parameters = glslFunction->getSequence()[0]->getAsAggregate()->getSequence();65206521#ifdef ENABLE_HLSL6522bool implicitThis = (int)parameters.size() > 0 && parameters[0]->getAsSymbolNode()->getName() ==6523glslangIntermediate->implicitThisName;6524#else6525bool implicitThis = false;6526#endif65276528paramDecorations.resize(parameters.size());6529for (int p = 0; p < (int)parameters.size(); ++p) {6530const glslang::TType& paramType = parameters[p]->getAsTyped()->getType();6531spv::Id typeId = convertGlslangToSpvType(paramType);6532if (originalParam(paramType.getQualifier().storage, paramType, implicitThis && p == 0))6533typeId = builder.makePointer(TranslateStorageClass(paramType), typeId);6534else if (writableParam(paramType.getQualifier().storage))6535typeId = builder.makePointer(spv::StorageClass::Function, typeId);6536else6537rValueParameters.insert(parameters[p]->getAsSymbolNode()->getId());6538getParamDecorations(paramDecorations[p], paramType, 
glslangIntermediate->usingVulkanMemoryModel());6539paramTypes.push_back(typeId);6540}65416542for (auto const parameter:parameters) {6543paramNames.push_back(parameter->getAsSymbolNode()->getName().c_str());6544}65456546spv::Block* functionBlock;6547spv::Function* function = builder.makeFunctionEntry(6548TranslatePrecisionDecoration(glslFunction->getType()), convertGlslangToSpvType(glslFunction->getType()),6549glslFunction->getName().c_str(), convertGlslangLinkageToSpv(glslFunction->getLinkType()), paramTypes,6550paramDecorations, &functionBlock);6551builder.setupFunctionDebugInfo(function, glslFunction->getName().c_str(), paramTypes, paramNames);6552if (implicitThis)6553function->setImplicitThis();65546555// Track function to emit/call later6556functionMap[glslFunction->getName().c_str()] = function;65576558// Set the parameter id's6559for (int p = 0; p < (int)parameters.size(); ++p) {6560symbolValues[parameters[p]->getAsSymbolNode()->getId()] = function->getParamId(p);6561// give a name too6562builder.addName(function->getParamId(p), parameters[p]->getAsSymbolNode()->getName().c_str());65636564const glslang::TType& paramType = parameters[p]->getAsTyped()->getType();6565if (paramType.contains8BitInt())6566builder.addCapability(spv::Capability::Int8);6567if (paramType.contains16BitInt())6568builder.addCapability(spv::Capability::Int16);6569if (paramType.contains16BitFloat())6570builder.addCapability(spv::Capability::Float16);6571}6572}6573}65746575// Process all the initializers, while skipping the functions and link objects6576void TGlslangToSpvTraverser::makeGlobalInitializers(const glslang::TIntermSequence& initializers)6577{6578builder.setBuildPoint(shaderEntry->getLastBlock());6579for (int i = 0; i < (int)initializers.size(); ++i) {6580glslang::TIntermAggregate* initializer = initializers[i]->getAsAggregate();6581if (initializer && initializer->getOp() != glslang::EOpFunction && initializer->getOp() !=6582glslang::EOpLinkerObjects) {65836584// We're on a 
top-level node that's not a function. Treat as an initializer, whose6585// code goes into the beginning of the entry point.6586initializer->traverse(this);6587}6588}6589}6590// Walk over all linker objects to create a map for payload and callable data linker objects6591// and their location to be used during codegen for OpTraceKHR and OpExecuteCallableKHR6592// This is done here since it is possible that these linker objects are not be referenced in the AST6593void TGlslangToSpvTraverser::collectRayTracingLinkerObjects()6594{6595glslang::TIntermAggregate* linkerObjects = glslangIntermediate->findLinkerObjects();6596for (auto& objSeq : linkerObjects->getSequence()) {6597auto objNode = objSeq->getAsSymbolNode();6598if (objNode != nullptr) {6599if (objNode->getQualifier().hasLocation()) {6600unsigned int location = objNode->getQualifier().layoutLocation;6601auto st = objNode->getQualifier().storage;6602int set;6603switch (st)6604{6605case glslang::EvqPayload:6606case glslang::EvqPayloadIn:6607set = 0;6608break;6609case glslang::EvqCallableData:6610case glslang::EvqCallableDataIn:6611set = 1;6612break;66136614case glslang::EvqHitObjectAttrNV:6615case glslang::EvqHitObjectAttrEXT:6616set = 2;6617break;66186619default:6620set = -1;6621}6622if (set != -1)6623locationToSymbol[set].insert(std::make_pair(location, objNode));6624}6625}6626}6627}6628// Process all the functions, while skipping initializers.6629void TGlslangToSpvTraverser::visitFunctions(const glslang::TIntermSequence& glslFunctions)6630{6631for (int f = 0; f < (int)glslFunctions.size(); ++f) {6632glslang::TIntermAggregate* node = glslFunctions[f]->getAsAggregate();6633if (node && (node->getOp() == glslang::EOpFunction || node->getOp() == glslang::EOpLinkerObjects))6634node->traverse(this);6635}6636}66376638void TGlslangToSpvTraverser::translateArguments(const glslang::TIntermAggregate& node, std::vector<spv::Id>& arguments,6639spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags)6640{6641const 
glslang::TIntermSequence& glslangArguments = node.getSequence();66426643glslang::TSampler sampler = {};6644bool cubeCompare = false;6645bool f16ShadowCompare = false;6646if (node.isTexture() || node.isImage()) {6647sampler = glslangArguments[0]->getAsTyped()->getType().getSampler();6648cubeCompare = sampler.dim == glslang::EsdCube && sampler.arrayed && sampler.shadow;6649f16ShadowCompare = sampler.shadow &&6650glslangArguments[1]->getAsTyped()->getType().getBasicType() == glslang::EbtFloat16;6651}66526653for (int i = 0; i < (int)glslangArguments.size(); ++i) {6654builder.clearAccessChain();6655glslangArguments[i]->traverse(this);66566657// Special case l-value operands6658bool lvalue = false;6659switch (node.getOp()) {6660case glslang::EOpImageAtomicAdd:6661case glslang::EOpImageAtomicMin:6662case glslang::EOpImageAtomicMax:6663case glslang::EOpImageAtomicAnd:6664case glslang::EOpImageAtomicOr:6665case glslang::EOpImageAtomicXor:6666case glslang::EOpImageAtomicExchange:6667case glslang::EOpImageAtomicCompSwap:6668case glslang::EOpImageAtomicLoad:6669case glslang::EOpImageAtomicStore:6670if (i == 0)6671lvalue = true;6672break;6673case glslang::EOpSparseImageLoad:6674if ((sampler.ms && i == 3) || (! sampler.ms && i == 2))6675lvalue = true;6676break;6677case glslang::EOpSparseTexture:6678if (((cubeCompare || f16ShadowCompare) && i == 3) || (! (cubeCompare || f16ShadowCompare) && i == 2))6679lvalue = true;6680break;6681case glslang::EOpSparseTextureClamp:6682if (((cubeCompare || f16ShadowCompare) && i == 4) || (! (cubeCompare || f16ShadowCompare) && i == 3))6683lvalue = true;6684break;6685case glslang::EOpSparseTextureLod:6686case glslang::EOpSparseTextureOffset:6687if ((f16ShadowCompare && i == 4) || (! 
f16ShadowCompare && i == 3))6688lvalue = true;6689break;6690case glslang::EOpSparseTextureFetch:6691if ((sampler.dim != glslang::EsdRect && i == 3) || (sampler.dim == glslang::EsdRect && i == 2))6692lvalue = true;6693break;6694case glslang::EOpSparseTextureFetchOffset:6695if ((sampler.dim != glslang::EsdRect && i == 4) || (sampler.dim == glslang::EsdRect && i == 3))6696lvalue = true;6697break;6698case glslang::EOpSparseTextureLodOffset:6699case glslang::EOpSparseTextureGrad:6700case glslang::EOpSparseTextureOffsetClamp:6701if ((f16ShadowCompare && i == 5) || (! f16ShadowCompare && i == 4))6702lvalue = true;6703break;6704case glslang::EOpSparseTextureGradOffset:6705case glslang::EOpSparseTextureGradClamp:6706if ((f16ShadowCompare && i == 6) || (! f16ShadowCompare && i == 5))6707lvalue = true;6708break;6709case glslang::EOpSparseTextureGradOffsetClamp:6710if ((f16ShadowCompare && i == 7) || (! f16ShadowCompare && i == 6))6711lvalue = true;6712break;6713case glslang::EOpSparseTextureGather:6714if ((sampler.shadow && i == 3) || (! sampler.shadow && i == 2))6715lvalue = true;6716break;6717case glslang::EOpSparseTextureGatherOffset:6718case glslang::EOpSparseTextureGatherOffsets:6719if ((sampler.shadow && i == 4) || (! 
sampler.shadow && i == 3))6720lvalue = true;6721break;6722case glslang::EOpSparseTextureGatherLod:6723if (i == 3)6724lvalue = true;6725break;6726case glslang::EOpSparseTextureGatherLodOffset:6727case glslang::EOpSparseTextureGatherLodOffsets:6728if (i == 4)6729lvalue = true;6730break;6731case glslang::EOpSparseImageLoadLod:6732if (i == 3)6733lvalue = true;6734break;6735case glslang::EOpImageSampleFootprintNV:6736if (i == 4)6737lvalue = true;6738break;6739case glslang::EOpImageSampleFootprintClampNV:6740case glslang::EOpImageSampleFootprintLodNV:6741if (i == 5)6742lvalue = true;6743break;6744case glslang::EOpImageSampleFootprintGradNV:6745if (i == 6)6746lvalue = true;6747break;6748case glslang::EOpImageSampleFootprintGradClampNV:6749if (i == 7)6750lvalue = true;6751break;6752case glslang::EOpRayQueryGetIntersectionTriangleVertexPositionsEXT:6753case glslang::EOpRayQueryGetIntersectionLSSPositionsNV:6754case glslang::EOpRayQueryGetIntersectionLSSRadiiNV:6755if (i == 2)6756lvalue = true;6757break;6758case glslang::EOpConstructSaturated:6759if (i == 0)6760lvalue = true;6761break;6762default:6763break;6764}67656766if (lvalue) {6767spv::Id lvalue_id = builder.accessChainGetLValue();6768arguments.push_back(lvalue_id);6769lvalueCoherentFlags = builder.getAccessChain().coherentFlags;6770builder.addDecoration(lvalue_id, TranslateNonUniformDecoration(lvalueCoherentFlags));6771lvalueCoherentFlags |= TranslateCoherent(glslangArguments[i]->getAsTyped()->getType());6772} else {6773if (i > 0 &&6774glslangArguments[i]->getAsSymbolNode() && glslangArguments[i-1]->getAsSymbolNode() &&6775glslangArguments[i]->getAsSymbolNode()->getId() == glslangArguments[i-1]->getAsSymbolNode()->getId()) {6776// Reuse the id if possible6777arguments.push_back(arguments[i-1]);6778} else {6779arguments.push_back(accessChainLoad(glslangArguments[i]->getAsTyped()->getType()));6780}6781}6782}6783}67846785void TGlslangToSpvTraverser::translateArguments(glslang::TIntermUnary& node, std::vector<spv::Id>& 
arguments)6786{6787builder.clearAccessChain();6788node.getOperand()->traverse(this);6789arguments.push_back(accessChainLoad(node.getOperand()->getType()));6790}67916792spv::Id TGlslangToSpvTraverser::createImageTextureFunctionCall(glslang::TIntermOperator* node)6793{6794if (! node->isImage() && ! node->isTexture())6795return spv::NoResult;67966797builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());67986799// Process a GLSL texturing op (will be SPV image)68006801const glslang::TType &imageType = node->getAsAggregate()6802? node->getAsAggregate()->getSequence()[0]->getAsTyped()->getType()6803: node->getAsUnaryNode()->getOperand()->getAsTyped()->getType();6804const glslang::TSampler sampler = imageType.getSampler();6805bool f16ShadowCompare = (sampler.shadow && node->getAsAggregate())6806? node->getAsAggregate()->getSequence()[1]->getAsTyped()->getType().getBasicType() == glslang::EbtFloat166807: false;68086809const auto signExtensionMask = [&]() {6810if (builder.getSpvVersion() >= spv::Spv_1_4) {6811if (sampler.type == glslang::EbtUint)6812return spv::ImageOperandsMask::ZeroExtend;6813else if (sampler.type == glslang::EbtInt)6814return spv::ImageOperandsMask::SignExtend;6815}6816return spv::ImageOperandsMask::MaskNone;6817};68186819spv::Builder::AccessChain::CoherentFlags lvalueCoherentFlags;68206821std::vector<spv::Id> arguments;6822if (node->getAsAggregate())6823translateArguments(*node->getAsAggregate(), arguments, lvalueCoherentFlags);6824else6825translateArguments(*node->getAsUnaryNode(), arguments);6826spv::Decoration precision = TranslatePrecisionDecoration(node->getType());68276828spv::Builder::TextureParameters params = { };6829params.sampler = arguments[0];68306831glslang::TCrackedTextureOp cracked;6832node->crackTexture(sampler, cracked);68336834const bool isUnsignedResult = node->getType().getBasicType() == glslang::EbtUint;68356836if (builder.isSampledImage(params.sampler) &&6837((cracked.query && node->getOp() != 
glslang::EOpTextureQueryLod) || cracked.fragMask || cracked.fetch)) {6838params.sampler = builder.createUnaryOp(spv::Op::OpImage, builder.getImageType(params.sampler), params.sampler);6839if (imageType.getQualifier().isNonUniform()) {6840builder.addDecoration(params.sampler, spv::Decoration::NonUniformEXT);6841}6842}6843// Check for queries6844if (cracked.query) {6845switch (node->getOp()) {6846case glslang::EOpImageQuerySize:6847case glslang::EOpTextureQuerySize:6848if (arguments.size() > 1) {6849params.lod = arguments[1];6850return builder.createTextureQueryCall(spv::Op::OpImageQuerySizeLod, params, isUnsignedResult);6851} else6852return builder.createTextureQueryCall(spv::Op::OpImageQuerySize, params, isUnsignedResult);6853case glslang::EOpImageQuerySamples:6854case glslang::EOpTextureQuerySamples:6855return builder.createTextureQueryCall(spv::Op::OpImageQuerySamples, params, isUnsignedResult);6856case glslang::EOpTextureQueryLod:6857params.coords = arguments[1];6858return builder.createTextureQueryCall(spv::Op::OpImageQueryLod, params, isUnsignedResult);6859case glslang::EOpTextureQueryLevels:6860return builder.createTextureQueryCall(spv::Op::OpImageQueryLevels, params, isUnsignedResult);6861case glslang::EOpSparseTexelsResident:6862return builder.createUnaryOp(spv::Op::OpImageSparseTexelsResident, builder.makeBoolType(), arguments[0]);6863default:6864assert(0);6865break;6866}6867}68686869int components = node->getType().getVectorSize();68706871if (node->getOp() == glslang::EOpImageLoad ||6872node->getOp() == glslang::EOpImageLoadLod ||6873node->getOp() == glslang::EOpTextureFetch ||6874node->getOp() == glslang::EOpTextureFetchOffset) {6875// These must produce 4 components, per SPIR-V spec. We'll add a conversion constructor if needed.6876// This will only happen through the HLSL path for operator[], so we do not have to handle e.g.6877// the EOpTexture/Proj/Lod/etc family. It would be harmless to do so, but would need more logic6878// here around e.g. 
which ones return scalars or other types.6879components = 4;6880}68816882glslang::TType returnType(node->getType().getBasicType(), glslang::EvqTemporary, components);68836884auto resultType = [&returnType,this]{ return convertGlslangToSpvType(returnType); };68856886// Check for image functions other than queries6887if (node->isImage()) {6888std::vector<spv::IdImmediate> operands;6889auto opIt = arguments.begin();6890spv::IdImmediate image = { true, *(opIt++) };6891operands.push_back(image);68926893// Handle subpass operations6894// TODO: GLSL should change to have the "MS" only on the type rather than the6895// built-in function.6896if (cracked.subpass) {6897// add on the (0,0) coordinate6898spv::Id zero = builder.makeIntConstant(0);6899std::vector<spv::Id> comps;6900comps.push_back(zero);6901comps.push_back(zero);6902spv::IdImmediate coord = { true,6903builder.makeCompositeConstant(builder.makeVectorType(builder.makeIntType(32), 2), comps) };6904operands.push_back(coord);6905spv::IdImmediate imageOperands = { false, spv::ImageOperandsMask::MaskNone };6906imageOperands.word = imageOperands.word | (unsigned)signExtensionMask();6907if (sampler.isMultiSample()) {6908imageOperands.word = imageOperands.word | (unsigned)spv::ImageOperandsMask::Sample;6909}6910if (imageOperands.word != (unsigned)spv::ImageOperandsMask::MaskNone) {6911operands.push_back(imageOperands);6912if (sampler.isMultiSample()) {6913spv::IdImmediate imageOperand = { true, *(opIt++) };6914operands.push_back(imageOperand);6915}6916}6917spv::Id result = builder.createOp(spv::Op::OpImageRead, resultType(), operands);6918builder.setPrecision(result, precision);6919return result;6920}69216922if (cracked.attachmentEXT) {6923if (opIt != arguments.end()) {6924spv::IdImmediate sample = { true, *opIt };6925operands.push_back(sample);6926}6927spv::Id result = builder.createOp(spv::Op::OpColorAttachmentReadEXT, resultType(), 
operands);6928builder.addExtension(spv::E_SPV_EXT_shader_tile_image);6929builder.setPrecision(result, precision);6930return result;6931}69326933spv::IdImmediate coord = { true, *(opIt++) };6934operands.push_back(coord);6935if (node->getOp() == glslang::EOpImageLoad || node->getOp() == glslang::EOpImageLoadLod) {6936spv::ImageOperandsMask mask = spv::ImageOperandsMask::MaskNone;6937if (sampler.isMultiSample()) {6938mask = mask | spv::ImageOperandsMask::Sample;6939}6940if (cracked.lod) {6941builder.addExtension(spv::E_SPV_AMD_shader_image_load_store_lod);6942builder.addCapability(spv::Capability::ImageReadWriteLodAMD);6943mask = mask | spv::ImageOperandsMask::Lod;6944}6945mask = mask | TranslateImageOperands(TranslateCoherent(imageType));6946mask = (spv::ImageOperandsMask)(mask & ~spv::ImageOperandsMask::MakeTexelAvailableKHR);6947mask = mask | signExtensionMask();6948if (mask != spv::ImageOperandsMask::MaskNone) {6949spv::IdImmediate imageOperands = { false, (unsigned int)mask };6950operands.push_back(imageOperands);6951}6952if (anySet(mask, spv::ImageOperandsMask::Sample)) {6953spv::IdImmediate imageOperand = { true, *opIt++ };6954operands.push_back(imageOperand);6955}6956if (anySet(mask, spv::ImageOperandsMask::Lod)) {6957spv::IdImmediate imageOperand = { true, *opIt++ };6958operands.push_back(imageOperand);6959}6960if (anySet(mask, spv::ImageOperandsMask::MakeTexelVisibleKHR)) {6961spv::IdImmediate imageOperand = { true,6962builder.makeUintConstant(TranslateMemoryScope(TranslateCoherent(imageType))) };6963operands.push_back(imageOperand);6964}69656966if (builder.getImageTypeFormat(builder.getImageType(operands.front().word)) == spv::ImageFormat::Unknown)6967builder.addCapability(spv::Capability::StorageImageReadWithoutFormat);69686969std::vector<spv::Id> result(1, builder.createOp(spv::Op::OpImageRead, resultType(), operands));6970builder.setPrecision(result[0], precision);69716972// If needed, add a conversion constructor to the proper size.6973if (components != 
node->getType().getVectorSize())6974result[0] = builder.createConstructor(precision, result, convertGlslangToSpvType(node->getType()));69756976return result[0];6977} else if (node->getOp() == glslang::EOpImageStore || node->getOp() == glslang::EOpImageStoreLod) {69786979// Push the texel value before the operands6980if (sampler.isMultiSample() || cracked.lod) {6981spv::IdImmediate texel = { true, *(opIt + 1) };6982operands.push_back(texel);6983} else {6984spv::IdImmediate texel = { true, *opIt };6985operands.push_back(texel);6986}69876988spv::ImageOperandsMask mask = spv::ImageOperandsMask::MaskNone;6989if (sampler.isMultiSample()) {6990mask = mask | spv::ImageOperandsMask::Sample;6991}6992if (cracked.lod) {6993builder.addExtension(spv::E_SPV_AMD_shader_image_load_store_lod);6994builder.addCapability(spv::Capability::ImageReadWriteLodAMD);6995mask = mask | spv::ImageOperandsMask::Lod;6996}6997mask = mask | TranslateImageOperands(TranslateCoherent(imageType));6998mask = (spv::ImageOperandsMask)(mask & ~spv::ImageOperandsMask::MakeTexelVisibleKHR);6999mask = mask | signExtensionMask();7000if (mask != spv::ImageOperandsMask::MaskNone) {7001spv::IdImmediate imageOperands = { false, (unsigned int)mask };7002operands.push_back(imageOperands);7003}7004if (anySet(mask, spv::ImageOperandsMask::Sample)) {7005spv::IdImmediate imageOperand = { true, *opIt++ };7006operands.push_back(imageOperand);7007}7008if (anySet(mask, spv::ImageOperandsMask::Lod)) {7009spv::IdImmediate imageOperand = { true, *opIt++ };7010operands.push_back(imageOperand);7011}7012if (anySet(mask, spv::ImageOperandsMask::MakeTexelAvailableKHR)) {7013spv::IdImmediate imageOperand = { true,7014builder.makeUintConstant(TranslateMemoryScope(TranslateCoherent(imageType))) };7015operands.push_back(imageOperand);7016}70177018builder.createNoResultOp(spv::Op::OpImageWrite, operands);7019if (builder.getImageTypeFormat(builder.getImageType(operands.front().word)) == 
spv::ImageFormat::Unknown)7020builder.addCapability(spv::Capability::StorageImageWriteWithoutFormat);7021return spv::NoResult;7022} else if (node->getOp() == glslang::EOpSparseImageLoad ||7023node->getOp() == glslang::EOpSparseImageLoadLod) {7024builder.addCapability(spv::Capability::SparseResidency);7025if (builder.getImageTypeFormat(builder.getImageType(operands.front().word)) == spv::ImageFormat::Unknown)7026builder.addCapability(spv::Capability::StorageImageReadWithoutFormat);70277028spv::ImageOperandsMask mask = spv::ImageOperandsMask::MaskNone;7029if (sampler.isMultiSample()) {7030mask = mask | spv::ImageOperandsMask::Sample;7031}7032if (cracked.lod) {7033builder.addExtension(spv::E_SPV_AMD_shader_image_load_store_lod);7034builder.addCapability(spv::Capability::ImageReadWriteLodAMD);70357036mask = mask | spv::ImageOperandsMask::Lod;7037}7038mask = mask | TranslateImageOperands(TranslateCoherent(imageType));7039mask = (spv::ImageOperandsMask)(mask & ~spv::ImageOperandsMask::MakeTexelAvailableKHR);7040mask = mask | signExtensionMask();7041if (mask != spv::ImageOperandsMask::MaskNone) {7042spv::IdImmediate imageOperands = { false, (unsigned int)mask };7043operands.push_back(imageOperands);7044}7045if (anySet(mask, spv::ImageOperandsMask::Sample)) {7046spv::IdImmediate imageOperand = { true, *opIt++ };7047operands.push_back(imageOperand);7048}7049if (anySet(mask, spv::ImageOperandsMask::Lod)) {7050spv::IdImmediate imageOperand = { true, *opIt++ };7051operands.push_back(imageOperand);7052}7053if (anySet(mask, spv::ImageOperandsMask::MakeTexelVisibleKHR)) {7054spv::IdImmediate imageOperand = { true, builder.makeUintConstant(TranslateMemoryScope(7055TranslateCoherent(imageType))) };7056operands.push_back(imageOperand);7057}70587059// Create the return type that was a special structure7060spv::Id texelOut = *opIt;7061spv::Id typeId0 = resultType();7062spv::Id typeId1 = builder.getDerefTypeId(texelOut);7063spv::Id resultTypeId = builder.makeStructResultType(typeId0, 
typeId1);70647065spv::Id resultId = builder.createOp(spv::Op::OpImageSparseRead, resultTypeId, operands);70667067// Decode the return type7068builder.createStore(builder.createCompositeExtract(resultId, typeId1, 1), texelOut);7069return builder.createCompositeExtract(resultId, typeId0, 0);7070} else {7071// Process image atomic operations70727073// GLSL "IMAGE_PARAMS" will involve in constructing an image texel pointer and this pointer,7074// as the first source operand, is required by SPIR-V atomic operations.7075// For non-MS, the sample value should be 07076spv::IdImmediate sample = { true, sampler.isMultiSample() ? *(opIt++) : builder.makeUintConstant(0) };7077operands.push_back(sample);70787079spv::Id resultTypeId;7080glslang::TBasicType typeProxy = node->getBasicType();7081// imageAtomicStore has a void return type so base the pointer type on7082// the type of the value operand.7083if (node->getOp() == glslang::EOpImageAtomicStore) {7084resultTypeId = builder.makePointer(spv::StorageClass::Image, builder.getTypeId(*opIt));7085typeProxy = node->getAsAggregate()->getSequence()[0]->getAsTyped()->getType().getSampler().type;7086} else {7087resultTypeId = builder.makePointer(spv::StorageClass::Image, resultType());7088}7089spv::Id pointer = builder.createOp(spv::Op::OpImageTexelPointer, resultTypeId, operands);7090if (imageType.getQualifier().nonUniform) {7091builder.addDecoration(pointer, spv::Decoration::NonUniformEXT);7092}70937094std::vector<spv::Id> operands;7095operands.push_back(pointer);7096for (; opIt != arguments.end(); ++opIt)7097operands.push_back(*opIt);70987099return createAtomicOperation(node->getOp(), precision, resultType(), operands, typeProxy,7100lvalueCoherentFlags, node->getType());7101}7102}71037104// Check for fragment mask functions other than queries7105if (cracked.fragMask) {7106assert(sampler.ms);71077108auto opIt = arguments.begin();7109std::vector<spv::Id> operands;71107111operands.push_back(params.sampler);7112++opIt;71137114if 
(sampler.isSubpass()) {7115// add on the (0,0) coordinate7116spv::Id zero = builder.makeIntConstant(0);7117std::vector<spv::Id> comps;7118comps.push_back(zero);7119comps.push_back(zero);7120operands.push_back(builder.makeCompositeConstant(7121builder.makeVectorType(builder.makeIntType(32), 2), comps));7122}71237124for (; opIt != arguments.end(); ++opIt)7125operands.push_back(*opIt);71267127spv::Op fragMaskOp = spv::Op::OpNop;7128if (node->getOp() == glslang::EOpFragmentMaskFetch)7129fragMaskOp = spv::Op::OpFragmentMaskFetchAMD;7130else if (node->getOp() == glslang::EOpFragmentFetch)7131fragMaskOp = spv::Op::OpFragmentFetchAMD;71327133builder.addExtension(spv::E_SPV_AMD_shader_fragment_mask);7134builder.addCapability(spv::Capability::FragmentMaskAMD);7135return builder.createOp(fragMaskOp, resultType(), operands);7136}71377138// Check for texture functions other than queries7139bool sparse = node->isSparseTexture();7140bool imageFootprint = node->isImageFootprint();7141bool cubeCompare = sampler.dim == glslang::EsdCube && sampler.isArrayed() && sampler.isShadow();71427143// check for bias argument7144bool bias = false;7145if (! cracked.lod && ! cracked.grad && ! cracked.fetch && ! 
cubeCompare) {7146int nonBiasArgCount = 2;7147if (cracked.gather)7148++nonBiasArgCount; // comp argument should be present when bias argument is present71497150if (f16ShadowCompare)7151++nonBiasArgCount;7152if (cracked.offset)7153++nonBiasArgCount;7154else if (cracked.offsets)7155++nonBiasArgCount;7156if (cracked.grad)7157nonBiasArgCount += 2;7158if (cracked.lodClamp)7159++nonBiasArgCount;7160if (sparse)7161++nonBiasArgCount;7162if (imageFootprint)7163//Following three extra arguments7164// int granularity, bool coarse, out gl_TextureFootprint2DNV footprint7165nonBiasArgCount += 3;7166if ((int)arguments.size() > nonBiasArgCount)7167bias = true;7168}71697170if (cracked.gather) {7171const auto& sourceExtensions = glslangIntermediate->getRequestedExtensions();7172if (bias || cracked.lod ||7173sourceExtensions.find(glslang::E_GL_AMD_texture_gather_bias_lod) != sourceExtensions.end()) {7174builder.addExtension(spv::E_SPV_AMD_texture_gather_bias_lod);7175builder.addCapability(spv::Capability::ImageGatherBiasLodAMD);7176}7177}71787179// set the rest of the arguments71807181params.coords = arguments[1];7182int extraArgs = 0;7183bool noImplicitLod = false;71847185// sort out where Dref is coming from7186if (cubeCompare || f16ShadowCompare) {7187params.Dref = arguments[2];7188++extraArgs;7189} else if (sampler.shadow && cracked.gather) {7190params.Dref = arguments[2];7191++extraArgs;7192} else if (sampler.shadow) {7193std::vector<spv::Id> indexes;7194int dRefComp;7195if (cracked.proj)7196dRefComp = 2; // "The resulting 3rd component of P in the shadow forms is used as Dref"7197else7198dRefComp = builder.getNumComponents(params.coords) - 1;7199indexes.push_back(dRefComp);7200params.Dref = builder.createCompositeExtract(params.coords,7201builder.getScalarTypeId(builder.getTypeId(params.coords)), indexes);7202}72037204// lod7205if (cracked.lod) {7206params.lod = arguments[2 + extraArgs];7207++extraArgs;7208} else if (glslangIntermediate->getStage() != EShLangFragment 
&&7209!(glslangIntermediate->getStage() == EShLangCompute &&7210glslangIntermediate->hasLayoutDerivativeModeNone())) {7211// we need to invent the default lod for an explicit lod instruction for a non-fragment stage7212noImplicitLod = true;7213}72147215// multisample7216if (sampler.isMultiSample()) {7217params.sample = arguments[2 + extraArgs]; // For MS, "sample" should be specified7218++extraArgs;7219}72207221// gradient7222if (cracked.grad) {7223params.gradX = arguments[2 + extraArgs];7224params.gradY = arguments[3 + extraArgs];7225extraArgs += 2;7226}72277228// offset and offsets7229if (cracked.offset) {7230params.offset = arguments[2 + extraArgs];7231++extraArgs;7232} else if (cracked.offsets) {7233params.offsets = arguments[2 + extraArgs];7234++extraArgs;7235}72367237// lod clamp7238if (cracked.lodClamp) {7239params.lodClamp = arguments[2 + extraArgs];7240++extraArgs;7241}7242// sparse7243if (sparse) {7244params.texelOut = arguments[2 + extraArgs];7245++extraArgs;7246}7247// gather component7248if (cracked.gather && ! 
sampler.shadow) {7249// default component is 0, if missing, otherwise an argument7250if (2 + extraArgs < (int)arguments.size()) {7251params.component = arguments[2 + extraArgs];7252++extraArgs;7253} else7254params.component = builder.makeIntConstant(0);7255}7256spv::Id resultStruct = spv::NoResult;7257if (imageFootprint) {7258//Following three extra arguments7259// int granularity, bool coarse, out gl_TextureFootprint2DNV footprint7260params.granularity = arguments[2 + extraArgs];7261params.coarse = arguments[3 + extraArgs];7262resultStruct = arguments[4 + extraArgs];7263extraArgs += 3;7264}72657266// bias7267if (bias) {7268params.bias = arguments[2 + extraArgs];7269++extraArgs;7270}72717272if (imageFootprint) {7273builder.addExtension(spv::E_SPV_NV_shader_image_footprint);7274builder.addCapability(spv::Capability::ImageFootprintNV);727572767277//resultStructType(OpenGL type) contains 5 elements:7278//struct gl_TextureFootprint2DNV {7279// uvec2 anchor;7280// uvec2 offset;7281// uvec2 mask;7282// uint lod;7283// uint granularity;7284//};7285//or7286//struct gl_TextureFootprint3DNV {7287// uvec3 anchor;7288// uvec3 offset;7289// uvec2 mask;7290// uint lod;7291// uint granularity;7292//};7293spv::Id resultStructType = builder.getContainedTypeId(builder.getTypeId(resultStruct));7294assert(builder.isStructType(resultStructType));72957296//resType (SPIR-V type) contains 6 elements:7297//Member 0 must be a Boolean type scalar(LOD),7298//Member 1 must be a vector of integer type, whose Signedness operand is 0(anchor),7299//Member 2 must be a vector of integer type, whose Signedness operand is 0(offset),7300//Member 3 must be a vector of integer type, whose Signedness operand is 0(mask),7301//Member 4 must be a scalar of integer type, whose Signedness operand is 0(lod),7302//Member 5 must be a scalar of integer type, whose Signedness operand is 0(granularity).7303std::vector<spv::Id> members;7304members.push_back(resultType());7305for (int i = 0; i < 5; i++) 
{7306members.push_back(builder.getContainedTypeId(resultStructType, i));7307}7308spv::Id resType = builder.makeStructType(members, {}, "ResType");73097310//call ImageFootprintNV7311spv::Id res = builder.createTextureCall(precision, resType, sparse, cracked.fetch, cracked.proj,7312cracked.gather, noImplicitLod, params, signExtensionMask());73137314//copy resType (SPIR-V type) to resultStructType(OpenGL type)7315for (int i = 0; i < 5; i++) {7316builder.clearAccessChain();7317builder.setAccessChainLValue(resultStruct);73187319//Accessing to a struct we created, no coherent flag is set7320spv::Builder::AccessChain::CoherentFlags flags;7321flags.clear();73227323builder.accessChainPush(builder.makeIntConstant(i), flags, 0);7324builder.accessChainStore(builder.createCompositeExtract(res, builder.getContainedTypeId(resType, i+1),7325i+1), TranslateNonUniformDecoration(imageType.getQualifier()));7326}7327return builder.createCompositeExtract(res, resultType(), 0);7328}73297330// projective component (might not to move)7331// GLSL: "The texture coordinates consumed from P, not including the last component of P,7332// are divided by the last component of P."7333// SPIR-V: "... (u [, v] [, w], q)... 
It may be a vector larger than needed, but all7334// unused components will appear after all used components."7335if (cracked.proj) {7336int projSourceComp = builder.getNumComponents(params.coords) - 1;7337int projTargetComp;7338switch (sampler.dim) {7339case glslang::Esd1D: projTargetComp = 1; break;7340case glslang::Esd2D: projTargetComp = 2; break;7341case glslang::EsdRect: projTargetComp = 2; break;7342default: projTargetComp = projSourceComp; break;7343}7344// copy the projective coordinate if we have to7345if (projTargetComp != projSourceComp) {7346spv::Id projComp = builder.createCompositeExtract(params.coords,7347builder.getScalarTypeId(builder.getTypeId(params.coords)), projSourceComp);7348params.coords = builder.createCompositeInsert(projComp, params.coords,7349builder.getTypeId(params.coords), projTargetComp);7350}7351}73527353// nonprivate7354if (imageType.getQualifier().nonprivate) {7355params.nonprivate = true;7356}73577358// volatile7359if (imageType.getQualifier().volatil) {7360params.volatil = true;7361}73627363if (imageType.getQualifier().nontemporal) {7364params.nontemporal = true;7365}73667367std::vector<spv::Id> result( 1,7368builder.createTextureCall(precision, resultType(), sparse, cracked.fetch, cracked.proj, cracked.gather,7369noImplicitLod, params, signExtensionMask())7370);73717372if (components != node->getType().getVectorSize())7373result[0] = builder.createConstructor(precision, result, convertGlslangToSpvType(node->getType()));73747375return result[0];7376}73777378spv::Id TGlslangToSpvTraverser::handleUserFunctionCall(const glslang::TIntermAggregate* node)7379{7380// Grab the function's pointer from the previously created function7381spv::Function* function = functionMap[node->getName().c_str()];7382if (! 
function)7383return 0;73847385const glslang::TIntermSequence& glslangArgs = node->getSequence();7386const glslang::TQualifierList& qualifiers = node->getQualifierList();73877388// See comments in makeFunctions() for details about the semantics for parameter passing.7389//7390// These imply we need a four step process:7391// 1. Evaluate the arguments7392// 2. Allocate and make copies of in, out, and inout arguments7393// 3. Make the call7394// 4. Copy back the results73957396// 1. Evaluate the arguments and their types7397std::vector<spv::Builder::AccessChain> lValues;7398std::vector<spv::Id> rValues;7399std::vector<const glslang::TType*> argTypes;7400for (int a = 0; a < (int)glslangArgs.size(); ++a) {7401argTypes.push_back(&glslangArgs[a]->getAsTyped()->getType());7402// build l-value7403builder.clearAccessChain();7404glslangArgs[a]->traverse(this);7405// keep outputs and pass-by-originals as l-values, evaluate others as r-values7406if (originalParam(qualifiers[a], *argTypes[a], function->hasImplicitThis() && a == 0) ||7407writableParam(qualifiers[a])) {7408// save l-value7409lValues.push_back(builder.getAccessChain());7410} else {7411// process r-value7412rValues.push_back(accessChainLoad(*argTypes.back()));7413}7414}74157416// Reset source location to the function call location after argument evaluation7417builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());74187419// 2. 
Allocate space for anything needing a copy, and if it's "in" or "inout"7420// copy the original into that space.7421//7422// Also, build up the list of actual arguments to pass in for the call7423int lValueCount = 0;7424int rValueCount = 0;7425std::vector<spv::Id> spvArgs;7426for (int a = 0; a < (int)glslangArgs.size(); ++a) {7427spv::Id arg;7428if (originalParam(qualifiers[a], *argTypes[a], function->hasImplicitThis() && a == 0)) {7429builder.setAccessChain(lValues[lValueCount]);7430arg = builder.accessChainGetLValue();7431++lValueCount;7432} else if (writableParam(qualifiers[a])) {7433// need space to hold the copy7434arg = builder.createVariable(function->getParamPrecision(a), spv::StorageClass::Function,7435builder.getContainedTypeId(function->getParamType(a)), "param");7436if (qualifiers[a] == glslang::EvqIn || qualifiers[a] == glslang::EvqInOut) {7437// need to copy the input into output space7438builder.setAccessChain(lValues[lValueCount]);7439spv::Id copy = accessChainLoad(*argTypes[a]);7440builder.clearAccessChain();7441builder.setAccessChainLValue(arg);7442multiTypeStore(*argTypes[a], copy);7443}7444++lValueCount;7445} else {7446// process r-value, which involves a copy for a type mismatch7447if (function->getParamType(a) != builder.getTypeId(rValues[rValueCount]) ||7448TranslatePrecisionDecoration(*argTypes[a]) != function->getParamPrecision(a))7449{7450spv::Id argCopy = builder.createVariable(function->getParamPrecision(a), spv::StorageClass::Function, function->getParamType(a), "arg");7451builder.clearAccessChain();7452builder.setAccessChainLValue(argCopy);7453multiTypeStore(*argTypes[a], rValues[rValueCount]);7454arg = builder.createLoad(argCopy, function->getParamPrecision(a));7455} else7456arg = rValues[rValueCount];7457++rValueCount;7458}7459spvArgs.push_back(arg);7460}74617462// 3. 
Make the call.7463spv::Id result = builder.createFunctionCall(function, spvArgs);7464builder.setPrecision(result, TranslatePrecisionDecoration(node->getType()));7465builder.addDecoration(result, TranslateNonUniformDecoration(node->getType().getQualifier()));74667467// 4. Copy back out an "out" arguments.7468lValueCount = 0;7469for (int a = 0; a < (int)glslangArgs.size(); ++a) {7470if (originalParam(qualifiers[a], *argTypes[a], function->hasImplicitThis() && a == 0))7471++lValueCount;7472else if (writableParam(qualifiers[a])) {7473if (qualifiers[a] == glslang::EvqOut || qualifiers[a] == glslang::EvqInOut) {7474spv::Id copy = builder.createLoad(spvArgs[a], spv::NoPrecision);7475builder.addDecoration(copy, TranslateNonUniformDecoration(argTypes[a]->getQualifier()));7476builder.setAccessChain(lValues[lValueCount]);7477multiTypeStore(*argTypes[a], copy);7478}7479++lValueCount;7480}7481}74827483return result;7484}74857486// Translate AST operation to SPV operation, already having SPV-based operands/types.7487spv::Id TGlslangToSpvTraverser::createBinaryOperation(glslang::TOperator op, OpDecorations& decorations,7488spv::Id typeId, spv::Id left, spv::Id right,7489glslang::TBasicType typeProxy, bool reduceComparison)7490{7491bool isUnsigned = isTypeUnsignedInt(typeProxy);7492bool isFloat = isTypeFloat(typeProxy);7493bool isBool = typeProxy == glslang::EbtBool;74947495spv::Op binOp = spv::Op::OpNop;7496bool needMatchingVectors = true; // for non-matrix ops, would a scalar need to smear to match a vector?7497bool comparison = false;74987499switch (op) {7500case glslang::EOpAdd:7501case glslang::EOpAddAssign:7502if (isFloat)7503binOp = spv::Op::OpFAdd;7504else7505binOp = spv::Op::OpIAdd;7506break;7507case glslang::EOpSub:7508case glslang::EOpSubAssign:7509if (isFloat)7510binOp = spv::Op::OpFSub;7511else7512binOp = spv::Op::OpISub;7513break;7514case glslang::EOpMul:7515case glslang::EOpMulAssign:7516if (isFloat)7517binOp = spv::Op::OpFMul;7518else7519binOp = 
spv::Op::OpIMul;7520break;7521case glslang::EOpVectorTimesScalar:7522case glslang::EOpVectorTimesScalarAssign:7523if (isFloat && (builder.isVector(left) || builder.isVector(right) || builder.isCooperativeVector(left) || builder.isCooperativeVector(right))) {7524if (builder.isVector(right) || builder.isCooperativeVector(right))7525std::swap(left, right);7526assert(builder.isScalar(right));7527needMatchingVectors = false;7528binOp = spv::Op::OpVectorTimesScalar;7529} else if (isFloat) {7530binOp = spv::Op::OpFMul;7531} else if (builder.isCooperativeVector(left) || builder.isCooperativeVector(right)) {7532if (builder.isCooperativeVector(right))7533std::swap(left, right);7534assert(builder.isScalar(right));7535// Construct a cooperative vector from the scalar7536right = builder.createCompositeConstruct(builder.getTypeId(left), { right });7537binOp = spv::Op::OpIMul;7538} else {7539binOp = spv::Op::OpIMul;7540}7541break;7542case glslang::EOpVectorTimesMatrix:7543case glslang::EOpVectorTimesMatrixAssign:7544binOp = spv::Op::OpVectorTimesMatrix;7545break;7546case glslang::EOpMatrixTimesVector:7547binOp = spv::Op::OpMatrixTimesVector;7548break;7549case glslang::EOpMatrixTimesScalar:7550case glslang::EOpMatrixTimesScalarAssign:7551binOp = spv::Op::OpMatrixTimesScalar;7552break;7553case glslang::EOpMatrixTimesMatrix:7554case glslang::EOpMatrixTimesMatrixAssign:7555binOp = spv::Op::OpMatrixTimesMatrix;7556break;7557case glslang::EOpOuterProduct:7558binOp = spv::Op::OpOuterProduct;7559needMatchingVectors = false;7560break;75617562case glslang::EOpDiv:7563case glslang::EOpDivAssign:7564if (isFloat)7565binOp = spv::Op::OpFDiv;7566else if (isUnsigned)7567binOp = spv::Op::OpUDiv;7568else7569binOp = spv::Op::OpSDiv;7570break;7571case glslang::EOpMod:7572case glslang::EOpModAssign:7573if (isFloat)7574binOp = spv::Op::OpFMod;7575else if (isUnsigned)7576binOp = spv::Op::OpUMod;7577else7578binOp = spv::Op::OpSMod;7579break;7580case glslang::EOpRightShift:7581case 
glslang::EOpRightShiftAssign:7582if (isUnsigned)7583binOp = spv::Op::OpShiftRightLogical;7584else7585binOp = spv::Op::OpShiftRightArithmetic;7586break;7587case glslang::EOpLeftShift:7588case glslang::EOpLeftShiftAssign:7589binOp = spv::Op::OpShiftLeftLogical;7590break;7591case glslang::EOpAnd:7592case glslang::EOpAndAssign:7593binOp = spv::Op::OpBitwiseAnd;7594break;7595case glslang::EOpLogicalAnd:7596needMatchingVectors = false;7597binOp = spv::Op::OpLogicalAnd;7598break;7599case glslang::EOpInclusiveOr:7600case glslang::EOpInclusiveOrAssign:7601binOp = spv::Op::OpBitwiseOr;7602break;7603case glslang::EOpLogicalOr:7604needMatchingVectors = false;7605binOp = spv::Op::OpLogicalOr;7606break;7607case glslang::EOpExclusiveOr:7608case glslang::EOpExclusiveOrAssign:7609binOp = spv::Op::OpBitwiseXor;7610break;7611case glslang::EOpLogicalXor:7612needMatchingVectors = false;7613binOp = spv::Op::OpLogicalNotEqual;7614break;76157616case glslang::EOpAbsDifference:7617binOp = isUnsigned ? spv::Op::OpAbsUSubINTEL : spv::Op::OpAbsISubINTEL;7618break;76197620case glslang::EOpAddSaturate:7621binOp = isUnsigned ? spv::Op::OpUAddSatINTEL : spv::Op::OpIAddSatINTEL;7622break;76237624case glslang::EOpSubSaturate:7625binOp = isUnsigned ? spv::Op::OpUSubSatINTEL : spv::Op::OpISubSatINTEL;7626break;76277628case glslang::EOpAverage:7629binOp = isUnsigned ? spv::Op::OpUAverageINTEL : spv::Op::OpIAverageINTEL;7630break;76317632case glslang::EOpAverageRounded:7633binOp = isUnsigned ? spv::Op::OpUAverageRoundedINTEL : spv::Op::OpIAverageRoundedINTEL;7634break;76357636case glslang::EOpMul32x16:7637binOp = isUnsigned ? 
spv::Op::OpUMul32x16INTEL : spv::Op::OpIMul32x16INTEL;7638break;76397640case glslang::EOpExpectEXT:7641binOp = spv::Op::OpExpectKHR;7642break;76437644case glslang::EOpLessThan:7645case glslang::EOpGreaterThan:7646case glslang::EOpLessThanEqual:7647case glslang::EOpGreaterThanEqual:7648case glslang::EOpEqual:7649case glslang::EOpNotEqual:7650case glslang::EOpVectorEqual:7651case glslang::EOpVectorNotEqual:7652comparison = true;7653break;7654default:7655break;7656}76577658// handle mapped binary operations (should be non-comparison)7659if (binOp != spv::Op::OpNop) {7660assert(comparison == false);7661if (builder.isMatrix(left) || builder.isMatrix(right) ||7662builder.isCooperativeMatrix(left) || builder.isCooperativeMatrix(right))7663return createBinaryMatrixOperation(binOp, decorations, typeId, left, right);76647665// No matrix involved; make both operands be the same number of components, if needed7666if (needMatchingVectors)7667builder.promoteScalar(decorations.precision, left, right);76687669spv::Id result = builder.createBinOp(binOp, typeId, left, right);7670decorations.addNoContraction(builder, result);7671decorations.addNonUniform(builder, result);7672return builder.setPrecision(result, decorations.precision);7673}76747675if (! 
comparison)7676return 0;76777678// Handle comparison instructions76797680if (reduceComparison && (op == glslang::EOpEqual || op == glslang::EOpNotEqual)7681&& (builder.isVector(left) || builder.isMatrix(left) || builder.isAggregate(left))) {7682spv::Id result = builder.createCompositeCompare(decorations.precision, left, right, op == glslang::EOpEqual);7683decorations.addNonUniform(builder, result);7684return result;7685}76867687switch (op) {7688case glslang::EOpLessThan:7689if (isFloat)7690binOp = spv::Op::OpFOrdLessThan;7691else if (isUnsigned)7692binOp = spv::Op::OpULessThan;7693else7694binOp = spv::Op::OpSLessThan;7695break;7696case glslang::EOpGreaterThan:7697if (isFloat)7698binOp = spv::Op::OpFOrdGreaterThan;7699else if (isUnsigned)7700binOp = spv::Op::OpUGreaterThan;7701else7702binOp = spv::Op::OpSGreaterThan;7703break;7704case glslang::EOpLessThanEqual:7705if (isFloat)7706binOp = spv::Op::OpFOrdLessThanEqual;7707else if (isUnsigned)7708binOp = spv::Op::OpULessThanEqual;7709else7710binOp = spv::Op::OpSLessThanEqual;7711break;7712case glslang::EOpGreaterThanEqual:7713if (isFloat)7714binOp = spv::Op::OpFOrdGreaterThanEqual;7715else if (isUnsigned)7716binOp = spv::Op::OpUGreaterThanEqual;7717else7718binOp = spv::Op::OpSGreaterThanEqual;7719break;7720case glslang::EOpEqual:7721case glslang::EOpVectorEqual:7722if (isFloat)7723binOp = spv::Op::OpFOrdEqual;7724else if (isBool)7725binOp = spv::Op::OpLogicalEqual;7726else7727binOp = spv::Op::OpIEqual;7728break;7729case glslang::EOpNotEqual:7730case glslang::EOpVectorNotEqual:7731if (isFloat)7732binOp = spv::Op::OpFUnordNotEqual;7733else if (isBool)7734binOp = spv::Op::OpLogicalNotEqual;7735else7736binOp = spv::Op::OpINotEqual;7737break;7738default:7739break;7740}77417742if (binOp != spv::Op::OpNop) {7743spv::Id result = builder.createBinOp(binOp, typeId, left, right);7744decorations.addNoContraction(builder, result);7745decorations.addNonUniform(builder, result);7746return builder.setPrecision(result, 
decorations.precision);7747}77487749return 0;7750}77517752//7753// Translate AST matrix operation to SPV operation, already having SPV-based operands/types.7754// These can be any of:7755//7756// matrix * scalar7757// scalar * matrix7758// matrix * matrix linear algebraic7759// matrix * vector7760// vector * matrix7761// matrix * matrix componentwise7762// matrix op matrix op in {+, -, /}7763// matrix op scalar op in {+, -, /}7764// scalar op matrix op in {+, -, /}7765//7766spv::Id TGlslangToSpvTraverser::createBinaryMatrixOperation(spv::Op op, OpDecorations& decorations, spv::Id typeId,7767spv::Id left, spv::Id right)7768{7769bool firstClass = true;77707771// First, handle first-class matrix operations (* and matrix/scalar)7772switch (op) {7773case spv::Op::OpFDiv:7774if (builder.isMatrix(left) && builder.isScalar(right)) {7775// turn matrix / scalar into a multiply...7776spv::Id resultType = builder.getTypeId(right);7777right = builder.createBinOp(spv::Op::OpFDiv, resultType, builder.makeFpConstant(resultType, 1.0), right);7778op = spv::Op::OpMatrixTimesScalar;7779} else7780firstClass = false;7781break;7782case spv::Op::OpMatrixTimesScalar:7783if (builder.isMatrix(right) || builder.isCooperativeMatrix(right))7784std::swap(left, right);7785assert(builder.isScalar(right));7786break;7787case spv::Op::OpVectorTimesMatrix:7788assert(builder.isVector(left));7789assert(builder.isMatrix(right));7790break;7791case spv::Op::OpMatrixTimesVector:7792assert(builder.isMatrix(left));7793assert(builder.isVector(right));7794break;7795case spv::Op::OpMatrixTimesMatrix:7796assert(builder.isMatrix(left));7797assert(builder.isMatrix(right));7798break;7799default:7800firstClass = false;7801break;7802}78037804if (builder.isCooperativeMatrix(left) || builder.isCooperativeMatrix(right))7805firstClass = true;78067807if (firstClass) {7808spv::Id result = builder.createBinOp(op, typeId, left, right);7809decorations.addNoContraction(builder, result);7810decorations.addNonUniform(builder, 
result);7811return builder.setPrecision(result, decorations.precision);7812}78137814// Handle component-wise +, -, *, %, and / for all combinations of type.7815// The result type of all of them is the same type as the (a) matrix operand.7816// The algorithm is to:7817// - break the matrix(es) into vectors7818// - smear any scalar to a vector7819// - do vector operations7820// - make a matrix out the vector results7821switch (op) {7822case spv::Op::OpFAdd:7823case spv::Op::OpFSub:7824case spv::Op::OpFDiv:7825case spv::Op::OpFMod:7826case spv::Op::OpFMul:7827{7828// one time set up...7829bool leftMat = builder.isMatrix(left);7830bool rightMat = builder.isMatrix(right);7831unsigned int numCols = leftMat ? builder.getNumColumns(left) : builder.getNumColumns(right);7832int numRows = leftMat ? builder.getNumRows(left) : builder.getNumRows(right);7833spv::Id scalarType = builder.getScalarTypeId(typeId);7834spv::Id vecType = builder.makeVectorType(scalarType, numRows);7835std::vector<spv::Id> results;7836spv::Id smearVec = spv::NoResult;7837if (builder.isScalar(left))7838smearVec = builder.smearScalar(decorations.precision, left, vecType);7839else if (builder.isScalar(right))7840smearVec = builder.smearScalar(decorations.precision, right, vecType);78417842// do each vector op7843for (unsigned int c = 0; c < numCols; ++c) {7844std::vector<unsigned int> indexes;7845indexes.push_back(c);7846spv::Id leftVec = leftMat ? builder.createCompositeExtract( left, vecType, indexes) : smearVec;7847spv::Id rightVec = rightMat ? 
builder.createCompositeExtract(right, vecType, indexes) : smearVec;7848spv::Id result = builder.createBinOp(op, vecType, leftVec, rightVec);7849decorations.addNoContraction(builder, result);7850decorations.addNonUniform(builder, result);7851results.push_back(builder.setPrecision(result, decorations.precision));7852}78537854// put the pieces together7855spv::Id result = builder.setPrecision(builder.createCompositeConstruct(typeId, results), decorations.precision);7856decorations.addNonUniform(builder, result);7857return result;7858}7859default:7860assert(0);7861return spv::NoResult;7862}7863}78647865spv::Id TGlslangToSpvTraverser::createUnaryOperation(glslang::TOperator op, OpDecorations& decorations, spv::Id typeId,7866spv::Id operand, glslang::TBasicType typeProxy, const spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags,7867const glslang::TType &opType)7868{7869spv::Op unaryOp = spv::Op::OpNop;7870int extBuiltins = -1;7871int libCall = -1;7872bool isUnsigned = isTypeUnsignedInt(typeProxy);7873bool isFloat = isTypeFloat(typeProxy);78747875switch (op) {7876case glslang::EOpNegative:7877if (isFloat) {7878unaryOp = spv::Op::OpFNegate;7879if (builder.isMatrixType(typeId))7880return createUnaryMatrixOperation(unaryOp, decorations, typeId, operand, typeProxy);7881} else7882unaryOp = spv::Op::OpSNegate;7883break;78847885case glslang::EOpLogicalNot:7886case glslang::EOpVectorLogicalNot:7887unaryOp = spv::Op::OpLogicalNot;7888break;7889case glslang::EOpBitwiseNot:7890unaryOp = spv::Op::OpNot;7891break;78927893case glslang::EOpDeterminant:7894libCall = spv::GLSLstd450Determinant;7895break;7896case glslang::EOpMatrixInverse:7897libCall = spv::GLSLstd450MatrixInverse;7898break;7899case glslang::EOpTranspose:7900unaryOp = spv::Op::OpTranspose;7901break;79027903case glslang::EOpRadians:7904libCall = spv::GLSLstd450Radians;7905break;7906case glslang::EOpDegrees:7907libCall = spv::GLSLstd450Degrees;7908break;7909case glslang::EOpSin:7910libCall = 
spv::GLSLstd450Sin;7911break;7912case glslang::EOpCos:7913libCall = spv::GLSLstd450Cos;7914break;7915case glslang::EOpTan:7916libCall = spv::GLSLstd450Tan;7917break;7918case glslang::EOpAcos:7919libCall = spv::GLSLstd450Acos;7920break;7921case glslang::EOpAsin:7922libCall = spv::GLSLstd450Asin;7923break;7924case glslang::EOpAtan:7925libCall = spv::GLSLstd450Atan;7926break;79277928case glslang::EOpAcosh:7929libCall = spv::GLSLstd450Acosh;7930break;7931case glslang::EOpAsinh:7932libCall = spv::GLSLstd450Asinh;7933break;7934case glslang::EOpAtanh:7935libCall = spv::GLSLstd450Atanh;7936break;7937case glslang::EOpTanh:7938libCall = spv::GLSLstd450Tanh;7939break;7940case glslang::EOpCosh:7941libCall = spv::GLSLstd450Cosh;7942break;7943case glslang::EOpSinh:7944libCall = spv::GLSLstd450Sinh;7945break;79467947case glslang::EOpLength:7948libCall = spv::GLSLstd450Length;7949break;7950case glslang::EOpNormalize:7951libCall = spv::GLSLstd450Normalize;7952break;79537954case glslang::EOpExp:7955libCall = spv::GLSLstd450Exp;7956break;7957case glslang::EOpLog:7958libCall = spv::GLSLstd450Log;7959break;7960case glslang::EOpExp2:7961libCall = spv::GLSLstd450Exp2;7962break;7963case glslang::EOpLog2:7964libCall = spv::GLSLstd450Log2;7965break;7966case glslang::EOpSqrt:7967libCall = spv::GLSLstd450Sqrt;7968break;7969case glslang::EOpInverseSqrt:7970libCall = spv::GLSLstd450InverseSqrt;7971break;79727973case glslang::EOpFloor:7974libCall = spv::GLSLstd450Floor;7975break;7976case glslang::EOpTrunc:7977libCall = spv::GLSLstd450Trunc;7978break;7979case glslang::EOpRound:7980libCall = spv::GLSLstd450Round;7981break;7982case glslang::EOpRoundEven:7983libCall = spv::GLSLstd450RoundEven;7984break;7985case glslang::EOpCeil:7986libCall = spv::GLSLstd450Ceil;7987break;7988case glslang::EOpFract:7989libCall = spv::GLSLstd450Fract;7990break;79917992case glslang::EOpIsNan:7993unaryOp = spv::Op::OpIsNan;7994break;7995case glslang::EOpIsInf:7996unaryOp = spv::Op::OpIsInf;7997break;7998case 
glslang::EOpIsFinite:7999unaryOp = spv::Op::OpIsFinite;8000break;80018002case glslang::EOpFloatBitsToInt:8003case glslang::EOpFloatBitsToUint:8004case glslang::EOpIntBitsToFloat:8005case glslang::EOpUintBitsToFloat:8006case glslang::EOpDoubleBitsToInt64:8007case glslang::EOpDoubleBitsToUint64:8008case glslang::EOpInt64BitsToDouble:8009case glslang::EOpUint64BitsToDouble:8010case glslang::EOpFloat16BitsToInt16:8011case glslang::EOpFloat16BitsToUint16:8012case glslang::EOpInt16BitsToFloat16:8013case glslang::EOpUint16BitsToFloat16:8014unaryOp = spv::Op::OpBitcast;8015break;80168017case glslang::EOpPackSnorm2x16:8018libCall = spv::GLSLstd450PackSnorm2x16;8019break;8020case glslang::EOpUnpackSnorm2x16:8021libCall = spv::GLSLstd450UnpackSnorm2x16;8022break;8023case glslang::EOpPackUnorm2x16:8024libCall = spv::GLSLstd450PackUnorm2x16;8025break;8026case glslang::EOpUnpackUnorm2x16:8027libCall = spv::GLSLstd450UnpackUnorm2x16;8028break;8029case glslang::EOpPackHalf2x16:8030libCall = spv::GLSLstd450PackHalf2x16;8031break;8032case glslang::EOpUnpackHalf2x16:8033libCall = spv::GLSLstd450UnpackHalf2x16;8034break;8035case glslang::EOpPackSnorm4x8:8036libCall = spv::GLSLstd450PackSnorm4x8;8037break;8038case glslang::EOpUnpackSnorm4x8:8039libCall = spv::GLSLstd450UnpackSnorm4x8;8040break;8041case glslang::EOpPackUnorm4x8:8042libCall = spv::GLSLstd450PackUnorm4x8;8043break;8044case glslang::EOpUnpackUnorm4x8:8045libCall = spv::GLSLstd450UnpackUnorm4x8;8046break;8047case glslang::EOpPackDouble2x32:8048libCall = spv::GLSLstd450PackDouble2x32;8049break;8050case glslang::EOpUnpackDouble2x32:8051libCall = spv::GLSLstd450UnpackDouble2x32;8052break;80538054case glslang::EOpPackInt2x32:8055case glslang::EOpUnpackInt2x32:8056case glslang::EOpPackUint2x32:8057case glslang::EOpUnpackUint2x32:8058case glslang::EOpPack16:8059case glslang::EOpPack32:8060case glslang::EOpPack64:8061case glslang::EOpUnpack32:8062case glslang::EOpUnpack16:8063case glslang::EOpUnpack8:8064case 
glslang::EOpPackInt2x16:8065case glslang::EOpUnpackInt2x16:8066case glslang::EOpPackUint2x16:8067case glslang::EOpUnpackUint2x16:8068case glslang::EOpPackInt4x16:8069case glslang::EOpUnpackInt4x16:8070case glslang::EOpPackUint4x16:8071case glslang::EOpUnpackUint4x16:8072case glslang::EOpPackFloat2x16:8073case glslang::EOpUnpackFloat2x16:8074unaryOp = spv::Op::OpBitcast;8075break;80768077case glslang::EOpDPdx:8078unaryOp = spv::Op::OpDPdx;8079break;8080case glslang::EOpDPdy:8081unaryOp = spv::Op::OpDPdy;8082break;8083case glslang::EOpFwidth:8084unaryOp = spv::Op::OpFwidth;8085break;80868087case glslang::EOpAny:8088unaryOp = spv::Op::OpAny;8089break;8090case glslang::EOpAll:8091unaryOp = spv::Op::OpAll;8092break;80938094case glslang::EOpAbs:8095if (isFloat)8096libCall = spv::GLSLstd450FAbs;8097else8098libCall = spv::GLSLstd450SAbs;8099break;8100case glslang::EOpSign:8101if (isFloat)8102libCall = spv::GLSLstd450FSign;8103else8104libCall = spv::GLSLstd450SSign;8105break;81068107case glslang::EOpDPdxFine:8108unaryOp = spv::Op::OpDPdxFine;8109break;8110case glslang::EOpDPdyFine:8111unaryOp = spv::Op::OpDPdyFine;8112break;8113case glslang::EOpFwidthFine:8114unaryOp = spv::Op::OpFwidthFine;8115break;8116case glslang::EOpDPdxCoarse:8117unaryOp = spv::Op::OpDPdxCoarse;8118break;8119case glslang::EOpDPdyCoarse:8120unaryOp = spv::Op::OpDPdyCoarse;8121break;8122case glslang::EOpFwidthCoarse:8123unaryOp = spv::Op::OpFwidthCoarse;8124break;8125case glslang::EOpRayQueryProceed:8126unaryOp = spv::Op::OpRayQueryProceedKHR;8127break;8128case glslang::EOpRayQueryGetRayTMin:8129unaryOp = spv::Op::OpRayQueryGetRayTMinKHR;8130break;8131case glslang::EOpRayQueryGetRayFlags:8132unaryOp = spv::Op::OpRayQueryGetRayFlagsKHR;8133break;8134case glslang::EOpRayQueryGetWorldRayOrigin:8135unaryOp = spv::Op::OpRayQueryGetWorldRayOriginKHR;8136break;8137case glslang::EOpRayQueryGetWorldRayDirection:8138unaryOp = spv::Op::OpRayQueryGetWorldRayDirectionKHR;8139break;8140case 
glslang::EOpRayQueryGetIntersectionCandidateAABBOpaque:8141unaryOp = spv::Op::OpRayQueryGetIntersectionCandidateAABBOpaqueKHR;8142break;8143case glslang::EOpInterpolateAtCentroid:8144if (typeProxy == glslang::EbtFloat16)8145builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float);8146libCall = spv::GLSLstd450InterpolateAtCentroid;8147break;8148case glslang::EOpAtomicCounterIncrement:8149case glslang::EOpAtomicCounterDecrement:8150case glslang::EOpAtomicCounter:8151{8152// Handle all of the atomics in one place, in createAtomicOperation()8153std::vector<spv::Id> operands;8154operands.push_back(operand);8155return createAtomicOperation(op, decorations.precision, typeId, operands, typeProxy, lvalueCoherentFlags, opType);8156}81578158case glslang::EOpBitFieldReverse:8159unaryOp = spv::Op::OpBitReverse;8160break;8161case glslang::EOpBitCount:8162unaryOp = spv::Op::OpBitCount;8163break;8164case glslang::EOpFindLSB:8165libCall = spv::GLSLstd450FindILsb;8166break;8167case glslang::EOpFindMSB:8168if (isUnsigned)8169libCall = spv::GLSLstd450FindUMsb;8170else8171libCall = spv::GLSLstd450FindSMsb;8172break;81738174case glslang::EOpCountLeadingZeros:8175builder.addCapability(spv::Capability::IntegerFunctions2INTEL);8176builder.addExtension("SPV_INTEL_shader_integer_functions2");8177unaryOp = spv::Op::OpUCountLeadingZerosINTEL;8178break;81798180case glslang::EOpCountTrailingZeros:8181builder.addCapability(spv::Capability::IntegerFunctions2INTEL);8182builder.addExtension("SPV_INTEL_shader_integer_functions2");8183unaryOp = spv::Op::OpUCountTrailingZerosINTEL;8184break;81858186case glslang::EOpBallot:8187case glslang::EOpReadFirstInvocation:8188case glslang::EOpAnyInvocation:8189case glslang::EOpAllInvocations:8190case glslang::EOpAllInvocationsEqual:8191case glslang::EOpMinInvocations:8192case glslang::EOpMaxInvocations:8193case glslang::EOpAddInvocations:8194case glslang::EOpMinInvocationsNonUniform:8195case glslang::EOpMaxInvocationsNonUniform:8196case 
glslang::EOpAddInvocationsNonUniform:8197case glslang::EOpMinInvocationsInclusiveScan:8198case glslang::EOpMaxInvocationsInclusiveScan:8199case glslang::EOpAddInvocationsInclusiveScan:8200case glslang::EOpMinInvocationsInclusiveScanNonUniform:8201case glslang::EOpMaxInvocationsInclusiveScanNonUniform:8202case glslang::EOpAddInvocationsInclusiveScanNonUniform:8203case glslang::EOpMinInvocationsExclusiveScan:8204case glslang::EOpMaxInvocationsExclusiveScan:8205case glslang::EOpAddInvocationsExclusiveScan:8206case glslang::EOpMinInvocationsExclusiveScanNonUniform:8207case glslang::EOpMaxInvocationsExclusiveScanNonUniform:8208case glslang::EOpAddInvocationsExclusiveScanNonUniform:8209{8210std::vector<spv::Id> operands;8211operands.push_back(operand);8212return createInvocationsOperation(op, typeId, operands, typeProxy);8213}8214case glslang::EOpSubgroupAll:8215case glslang::EOpSubgroupAny:8216case glslang::EOpSubgroupAllEqual:8217case glslang::EOpSubgroupBroadcastFirst:8218case glslang::EOpSubgroupBallot:8219case glslang::EOpSubgroupInverseBallot:8220case glslang::EOpSubgroupBallotBitCount:8221case glslang::EOpSubgroupBallotInclusiveBitCount:8222case glslang::EOpSubgroupBallotExclusiveBitCount:8223case glslang::EOpSubgroupBallotFindLSB:8224case glslang::EOpSubgroupBallotFindMSB:8225case glslang::EOpSubgroupAdd:8226case glslang::EOpSubgroupMul:8227case glslang::EOpSubgroupMin:8228case glslang::EOpSubgroupMax:8229case glslang::EOpSubgroupAnd:8230case glslang::EOpSubgroupOr:8231case glslang::EOpSubgroupXor:8232case glslang::EOpSubgroupInclusiveAdd:8233case glslang::EOpSubgroupInclusiveMul:8234case glslang::EOpSubgroupInclusiveMin:8235case glslang::EOpSubgroupInclusiveMax:8236case glslang::EOpSubgroupInclusiveAnd:8237case glslang::EOpSubgroupInclusiveOr:8238case glslang::EOpSubgroupInclusiveXor:8239case glslang::EOpSubgroupExclusiveAdd:8240case glslang::EOpSubgroupExclusiveMul:8241case glslang::EOpSubgroupExclusiveMin:8242case glslang::EOpSubgroupExclusiveMax:8243case 
glslang::EOpSubgroupExclusiveAnd:8244case glslang::EOpSubgroupExclusiveOr:8245case glslang::EOpSubgroupExclusiveXor:8246case glslang::EOpSubgroupQuadSwapHorizontal:8247case glslang::EOpSubgroupQuadSwapVertical:8248case glslang::EOpSubgroupQuadSwapDiagonal:8249case glslang::EOpSubgroupQuadAll:8250case glslang::EOpSubgroupQuadAny: {8251std::vector<spv::Id> operands;8252operands.push_back(operand);8253return createSubgroupOperation(op, typeId, operands, typeProxy);8254}8255case glslang::EOpMbcnt:8256extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_ballot);8257libCall = spv::MbcntAMD;8258break;82598260case glslang::EOpCubeFaceIndex:8261extBuiltins = getExtBuiltins(spv::E_SPV_AMD_gcn_shader);8262libCall = spv::CubeFaceIndexAMD;8263break;82648265case glslang::EOpCubeFaceCoord:8266extBuiltins = getExtBuiltins(spv::E_SPV_AMD_gcn_shader);8267libCall = spv::CubeFaceCoordAMD;8268break;8269case glslang::EOpSubgroupPartition:8270unaryOp = spv::Op::OpGroupNonUniformPartitionNV;8271break;8272case glslang::EOpConstructReference:8273unaryOp = spv::Op::OpBitcast;8274break;82758276case glslang::EOpConvUint64ToAccStruct:8277case glslang::EOpConvUvec2ToAccStruct:8278unaryOp = spv::Op::OpConvertUToAccelerationStructureKHR;8279break;82808281case glslang::EOpHitObjectIsEmptyNV:8282unaryOp = spv::Op::OpHitObjectIsEmptyNV;8283break;82848285case glslang::EOpHitObjectIsEmptyEXT:8286unaryOp = spv::Op::OpHitObjectIsEmptyEXT;8287break;82888289case glslang::EOpHitObjectIsMissNV:8290unaryOp = spv::Op::OpHitObjectIsMissNV;8291break;82928293case glslang::EOpHitObjectIsMissEXT:8294unaryOp = spv::Op::OpHitObjectIsMissEXT;8295break;82968297case glslang::EOpHitObjectIsHitNV:8298unaryOp = spv::Op::OpHitObjectIsHitNV;8299break;83008301case glslang::EOpHitObjectIsHitEXT:8302unaryOp = spv::Op::OpHitObjectIsHitEXT;8303break;83048305case glslang::EOpHitObjectGetObjectRayOriginNV:8306unaryOp = spv::Op::OpHitObjectGetObjectRayOriginNV;8307break;83088309case 
glslang::EOpHitObjectGetObjectRayOriginEXT:8310unaryOp = spv::Op::OpHitObjectGetObjectRayOriginEXT;8311break;83128313case glslang::EOpHitObjectGetObjectRayDirectionNV:8314unaryOp = spv::Op::OpHitObjectGetObjectRayDirectionNV;8315break;83168317case glslang::EOpHitObjectGetObjectRayDirectionEXT:8318unaryOp = spv::Op::OpHitObjectGetObjectRayDirectionEXT;8319break;83208321case glslang::EOpHitObjectGetWorldRayOriginNV:8322unaryOp = spv::Op::OpHitObjectGetWorldRayOriginNV;8323break;83248325case glslang::EOpHitObjectGetWorldRayOriginEXT:8326unaryOp = spv::Op::OpHitObjectGetWorldRayOriginEXT;8327break;83288329case glslang::EOpHitObjectGetWorldRayDirectionNV:8330unaryOp = spv::Op::OpHitObjectGetWorldRayDirectionNV;8331break;83328333case glslang::EOpHitObjectGetWorldRayDirectionEXT:8334unaryOp = spv::Op::OpHitObjectGetWorldRayDirectionEXT;8335break;83368337case glslang::EOpHitObjectGetObjectToWorldNV:8338unaryOp = spv::Op::OpHitObjectGetObjectToWorldNV;8339break;83408341case glslang::EOpHitObjectGetObjectToWorldEXT:8342unaryOp = spv::Op::OpHitObjectGetObjectToWorldEXT;8343break;83448345case glslang::EOpHitObjectGetWorldToObjectNV:8346unaryOp = spv::Op::OpHitObjectGetWorldToObjectNV;8347break;83488349case glslang::EOpHitObjectGetWorldToObjectEXT:8350unaryOp = spv::Op::OpHitObjectGetWorldToObjectEXT;8351break;83528353case glslang::EOpHitObjectGetRayTMinNV:8354unaryOp = spv::Op::OpHitObjectGetRayTMinNV;8355break;83568357case glslang::EOpHitObjectGetRayTMinEXT:8358unaryOp = spv::Op::OpHitObjectGetRayTMinEXT;8359break;83608361case glslang::EOpHitObjectGetRayTMaxNV:8362unaryOp = spv::Op::OpHitObjectGetRayTMaxNV;8363break;83648365case glslang::EOpHitObjectGetRayTMaxEXT:8366unaryOp = spv::Op::OpHitObjectGetRayTMaxEXT;8367break;83688369case glslang::EOpHitObjectGetRayFlagsEXT:8370unaryOp = spv::Op::OpHitObjectGetRayFlagsEXT;8371break;83728373case glslang::EOpHitObjectGetPrimitiveIndexNV:8374unaryOp = spv::Op::OpHitObjectGetPrimitiveIndexNV;8375break;83768377case 
glslang::EOpHitObjectGetPrimitiveIndexEXT:8378unaryOp = spv::Op::OpHitObjectGetPrimitiveIndexEXT;8379break;83808381case glslang::EOpHitObjectGetInstanceIdNV:8382unaryOp = spv::Op::OpHitObjectGetInstanceIdNV;8383break;83848385case glslang::EOpHitObjectGetInstanceIdEXT:8386unaryOp = spv::Op::OpHitObjectGetInstanceIdEXT;8387break;83888389case glslang::EOpHitObjectGetInstanceCustomIndexNV:8390unaryOp = spv::Op::OpHitObjectGetInstanceCustomIndexNV;8391break;83928393case glslang::EOpHitObjectGetInstanceCustomIndexEXT:8394unaryOp = spv::Op::OpHitObjectGetInstanceCustomIndexEXT;8395break;83968397case glslang::EOpHitObjectGetGeometryIndexNV:8398unaryOp = spv::Op::OpHitObjectGetGeometryIndexNV;8399break;84008401case glslang::EOpHitObjectGetGeometryIndexEXT:8402unaryOp = spv::Op::OpHitObjectGetGeometryIndexEXT;8403break;84048405case glslang::EOpHitObjectGetHitKindNV:8406unaryOp = spv::Op::OpHitObjectGetHitKindNV;8407break;84088409case glslang::EOpHitObjectGetHitKindEXT:8410unaryOp = spv::Op::OpHitObjectGetHitKindEXT;8411break;84128413case glslang::EOpHitObjectGetCurrentTimeNV:8414unaryOp = spv::Op::OpHitObjectGetCurrentTimeNV;8415break;84168417case glslang::EOpHitObjectGetCurrentTimeEXT:8418unaryOp = spv::Op::OpHitObjectGetCurrentTimeEXT;8419break;84208421case glslang::EOpHitObjectGetShaderBindingTableRecordIndexNV:8422unaryOp = spv::Op::OpHitObjectGetShaderBindingTableRecordIndexNV;8423break;84248425case glslang::EOpHitObjectGetShaderBindingTableRecordIndexEXT:8426unaryOp = spv::Op::OpHitObjectGetShaderBindingTableRecordIndexEXT;8427break;84288429case glslang::EOpHitObjectGetShaderRecordBufferHandleNV:8430unaryOp = spv::Op::OpHitObjectGetShaderRecordBufferHandleNV;8431break;84328433case glslang::EOpHitObjectGetClusterIdNV:8434unaryOp = 
spv::Op::OpHitObjectGetClusterIdNV;8435builder.addExtension(spv::E_SPV_NV_cluster_acceleration_structure);8436builder.addCapability(spv::Capability::ShaderInvocationReorderNV);8437builder.addCapability(spv::Capability::RayTracingClusterAccelerationStructureNV);8438break;84398440case glslang::EOpHitObjectGetSpherePositionNV:8441unaryOp = spv::Op::OpHitObjectGetSpherePositionNV;8442builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);8443builder.addCapability(spv::Capability::ShaderInvocationReorderNV);8444builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);8445break;84468447case glslang::EOpHitObjectGetSphereRadiusNV:8448unaryOp = spv::Op::OpHitObjectGetSphereRadiusNV;8449builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);8450builder.addCapability(spv::Capability::ShaderInvocationReorderNV);8451builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);8452break;84538454case glslang::EOpHitObjectIsSphereHitNV:8455unaryOp = spv::Op::OpHitObjectIsSphereHitNV;8456builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);8457builder.addCapability(spv::Capability::ShaderInvocationReorderNV);8458builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);8459break;84608461case glslang::EOpHitObjectIsLSSHitNV:8462unaryOp = spv::Op::OpHitObjectIsLSSHitNV;8463builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);8464builder.addCapability(spv::Capability::ShaderInvocationReorderNV);8465builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);8466break;84678468case glslang::EOpHitObjectGetShaderRecordBufferHandleEXT:8469unaryOp = spv::Op::OpHitObjectGetShaderRecordBufferHandleEXT;8470break;84718472case glslang::EOpFetchMicroTriangleVertexPositionNV:8473unaryOp = spv::Op::OpFetchMicroTriangleVertexPositionNV;8474break;84758476case glslang::EOpFetchMicroTriangleVertexBarycentricNV:8477unaryOp = spv::Op::OpFetchMicroTriangleVertexBarycentricNV;8478break;84798480case glslang::EOpCopyObject:8481unaryOp = 
spv::Op::OpCopyObject;8482break;84838484case glslang::EOpDepthAttachmentReadEXT:8485builder.addExtension(spv::E_SPV_EXT_shader_tile_image);8486builder.addCapability(spv::Capability::TileImageDepthReadAccessEXT);8487unaryOp = spv::Op::OpDepthAttachmentReadEXT;8488decorations.precision = spv::NoPrecision;8489break;8490case glslang::EOpStencilAttachmentReadEXT:8491builder.addExtension(spv::E_SPV_EXT_shader_tile_image);8492builder.addCapability(spv::Capability::TileImageStencilReadAccessEXT);8493unaryOp = spv::Op::OpStencilAttachmentReadEXT;8494decorations.precision = spv::Decoration::RelaxedPrecision;8495break;84968497default:8498return 0;8499}85008501spv::Id id;8502if (libCall >= 0) {8503std::vector<spv::Id> args;8504args.push_back(operand);8505id = builder.createBuiltinCall(typeId, extBuiltins >= 0 ? extBuiltins : stdBuiltins, libCall, args);8506} else {8507id = builder.createUnaryOp(unaryOp, typeId, operand);8508}85098510decorations.addNoContraction(builder, id);8511decorations.addNonUniform(builder, id);8512return builder.setPrecision(id, decorations.precision);8513}85148515// Create a unary operation on a matrix8516spv::Id TGlslangToSpvTraverser::createUnaryMatrixOperation(spv::Op op, OpDecorations& decorations, spv::Id typeId,8517spv::Id operand, glslang::TBasicType /* typeProxy */)8518{8519// Handle unary operations vector by vector.8520// The result type is the same type as the original type.8521// The algorithm is to:8522// - break the matrix into vectors8523// - apply the operation to each vector8524// - make a matrix out the vector results85258526// get the types sorted out8527int numCols = builder.getNumColumns(operand);8528int numRows = builder.getNumRows(operand);8529spv::Id srcVecType = builder.makeVectorType(builder.getScalarTypeId(builder.getTypeId(operand)), numRows);8530spv::Id destVecType = builder.makeVectorType(builder.getScalarTypeId(typeId), numRows);8531std::vector<spv::Id> results;85328533// do each vector op8534for (int c = 0; c < numCols; 
++c) {8535std::vector<unsigned int> indexes;8536indexes.push_back(c);8537spv::Id srcVec = builder.createCompositeExtract(operand, srcVecType, indexes);8538spv::Id destVec = builder.createUnaryOp(op, destVecType, srcVec);8539decorations.addNoContraction(builder, destVec);8540decorations.addNonUniform(builder, destVec);8541results.push_back(builder.setPrecision(destVec, decorations.precision));8542}85438544// put the pieces together8545spv::Id result = builder.setPrecision(builder.createCompositeConstruct(typeId, results), decorations.precision);8546decorations.addNonUniform(builder, result);8547return result;8548}85498550// For converting integers where both the bitwidth and the signedness could8551// change, but only do the width change here. The caller is still responsible8552// for the signedness conversion.8553// destType is the final type that will be converted to, but this function8554// may only be doing part of that conversion.8555spv::Id TGlslangToSpvTraverser::createIntWidthConversion(spv::Id operand, int vectorSize, spv::Id destType,8556glslang::TBasicType resultBasicType, glslang::TBasicType operandBasicType)8557{8558// Get the result type width, based on the type to convert to.8559int width = GetNumBits(resultBasicType);85608561// Get the conversion operation and result type,8562// based on the target width, but the source type.8563spv::Id type = spv::NoType;8564spv::Op convOp = spv::Op::OpNop;8565if (isTypeSignedInt(operandBasicType)) {8566convOp = spv::Op::OpSConvert;8567type = builder.makeIntType(width);8568} else {8569convOp = spv::Op::OpUConvert;8570type = builder.makeUintType(width);8571}85728573if (builder.getOpCode(destType) == spv::Op::OpTypeCooperativeVectorNV) {8574type = builder.makeCooperativeVectorTypeNV(type, builder.getCooperativeVectorNumComponents(destType));8575} else if (vectorSize > 0)8576type = builder.makeVectorType(type, vectorSize);8577else if (builder.getOpCode(destType) == spv::Op::OpTypeCooperativeMatrixKHR 
||8578builder.getOpCode(destType) == spv::Op::OpTypeCooperativeMatrixNV) {85798580type = builder.makeCooperativeMatrixTypeWithSameShape(type, destType);8581}85828583return builder.createUnaryOp(convOp, type, operand);8584}85858586spv::Id TGlslangToSpvTraverser::createConversion(glslang::TOperator op, OpDecorations& decorations, spv::Id destType,8587spv::Id operand, glslang::TBasicType resultBasicType, glslang::TBasicType operandBasicType)8588{8589spv::Op convOp = spv::Op::OpNop;8590spv::Id zero = 0;8591spv::Id one = 0;85928593int vectorSize = builder.isVectorType(destType) ? builder.getNumTypeComponents(destType) : 0;85948595if (IsOpNumericConv(op) || op == glslang::EOpConstructSaturated) {8596if (isTypeSignedInt(operandBasicType) && isTypeFloat(resultBasicType)) {8597convOp = spv::Op::OpConvertSToF;8598}8599if (isTypeUnsignedInt(operandBasicType) && isTypeFloat(resultBasicType)) {8600convOp = spv::Op::OpConvertUToF;8601}8602if (isTypeFloat(operandBasicType) && isTypeSignedInt(resultBasicType)) {8603convOp = spv::Op::OpConvertFToS;8604}8605if (isTypeFloat(operandBasicType) && isTypeUnsignedInt(resultBasicType)) {8606convOp = spv::Op::OpConvertFToU;8607}8608if (isTypeSignedInt(operandBasicType) && isTypeSignedInt(resultBasicType)) {8609convOp = spv::Op::OpSConvert;8610}8611if (isTypeUnsignedInt(operandBasicType) && isTypeUnsignedInt(resultBasicType)) {8612convOp = spv::Op::OpUConvert;8613}8614if (isTypeFloat(operandBasicType) && isTypeFloat(resultBasicType)) {8615convOp = spv::Op::OpFConvert;8616if (builder.isMatrixType(destType))8617return createUnaryMatrixOperation(convOp, decorations, destType, operand, operandBasicType);8618}8619if (isTypeInt(operandBasicType) && isTypeInt(resultBasicType) &&8620isTypeUnsignedInt(operandBasicType) != isTypeUnsignedInt(resultBasicType)) {86218622if (GetNumBits(operandBasicType) != GetNumBits(resultBasicType)) {8623// OpSConvert/OpUConvert + OpBitCast8624operand = createIntWidthConversion(operand, vectorSize, destType, 
resultBasicType, operandBasicType);8625}86268627if (builder.isInSpecConstCodeGenMode()) {8628uint32_t bits = GetNumBits(resultBasicType);8629spv::Id zeroType = builder.makeUintType(bits);8630if (bits == 64) {8631zero = builder.makeInt64Constant(zeroType, 0, false);8632} else {8633zero = builder.makeIntConstant(zeroType, 0, false);8634}8635zero = makeSmearedConstant(zero, vectorSize);8636// Use OpIAdd, instead of OpBitcast to do the conversion when8637// generating for OpSpecConstantOp instruction.8638return builder.createBinOp(spv::Op::OpIAdd, destType, operand, zero);8639}8640// For normal run-time conversion instruction, use OpBitcast.8641convOp = spv::Op::OpBitcast;8642}8643if (resultBasicType == glslang::EbtBool) {8644uint32_t bits = GetNumBits(operandBasicType);8645if (isTypeInt(operandBasicType)) {8646spv::Id zeroType = builder.makeUintType(bits);8647if (bits == 64) {8648zero = builder.makeInt64Constant(zeroType, 0, false);8649} else {8650zero = builder.makeIntConstant(zeroType, 0, false);8651}8652zero = makeSmearedConstant(zero, vectorSize);8653return builder.createBinOp(spv::Op::OpINotEqual, destType, operand, zero);8654} else {8655assert(isTypeFloat(operandBasicType));8656if (bits == 64) {8657zero = builder.makeDoubleConstant(0.0);8658} else if (bits == 32) {8659zero = builder.makeFloatConstant(0.0);8660} else {8661assert(bits == 16);8662zero = builder.makeFloat16Constant(0.0);8663}8664zero = makeSmearedConstant(zero, vectorSize);8665return builder.createBinOp(spv::Op::OpFUnordNotEqual, destType, operand, zero);8666}8667}8668if (operandBasicType == glslang::EbtBool) {8669uint32_t bits = GetNumBits(resultBasicType);8670convOp = spv::Op::OpSelect;8671if (isTypeInt(resultBasicType)) {8672spv::Id zeroType = isTypeSignedInt(resultBasicType) ? 
builder.makeIntType(bits) : builder.makeUintType(bits);8673if (bits == 64) {8674zero = builder.makeInt64Constant(zeroType, 0, false);8675one = builder.makeInt64Constant(zeroType, 1, false);8676} else {8677zero = builder.makeIntConstant(zeroType, 0, false);8678one = builder.makeIntConstant(zeroType, 1, false);8679}8680} else {8681assert(isTypeFloat(resultBasicType));8682if (bits == 64) {8683zero = builder.makeDoubleConstant(0.0);8684one = builder.makeDoubleConstant(1.0);8685} else if (bits == 32) {8686zero = builder.makeFloatConstant(0.0);8687one = builder.makeFloatConstant(1.0);8688} else {8689assert(bits == 16);8690zero = builder.makeFloat16Constant(0.0);8691one = builder.makeFloat16Constant(1.0);8692}8693}8694}8695}86968697if (convOp == spv::Op::OpNop) {8698switch (op) {8699case glslang::EOpConvUint64ToPtr:8700convOp = spv::Op::OpConvertUToPtr;8701break;8702case glslang::EOpConvPtrToUint64:8703convOp = spv::Op::OpConvertPtrToU;8704break;8705case glslang::EOpConvPtrToUvec2:8706case glslang::EOpConvUvec2ToPtr:8707convOp = spv::Op::OpBitcast;8708break;87098710default:8711break;8712}8713}87148715spv::Id result = 0;8716if (convOp == spv::Op::OpNop)8717return result;87188719if (convOp == spv::Op::OpSelect) {8720zero = makeSmearedConstant(zero, vectorSize);8721one = makeSmearedConstant(one, vectorSize);8722result = builder.createTriOp(convOp, destType, operand, one, zero);8723} else8724result = builder.createUnaryOp(convOp, destType, operand);87258726result = builder.setPrecision(result, decorations.precision);8727decorations.addNonUniform(builder, result);8728return result;8729}87308731spv::Id TGlslangToSpvTraverser::makeSmearedConstant(spv::Id constant, int vectorSize)8732{8733if (vectorSize == 0)8734return constant;87358736spv::Id vectorTypeId = builder.makeVectorType(builder.getTypeId(constant), vectorSize);8737std::vector<spv::Id> components;8738for (int c = 0; c < vectorSize; ++c)8739components.push_back(constant);8740return 
builder.makeCompositeConstant(vectorTypeId, components);8741}87428743// For glslang ops that map to SPV atomic opCodes8744spv::Id TGlslangToSpvTraverser::createAtomicOperation(glslang::TOperator op, spv::Decoration /*precision*/,8745spv::Id typeId, std::vector<spv::Id>& operands, glslang::TBasicType typeProxy,8746const spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags, const glslang::TType &opType)8747{8748spv::Op opCode = spv::Op::OpNop;87498750switch (op) {8751case glslang::EOpAtomicAdd:8752case glslang::EOpImageAtomicAdd:8753case glslang::EOpAtomicCounterAdd:8754opCode = spv::Op::OpAtomicIAdd;8755if (typeProxy == glslang::EbtFloat16 || typeProxy == glslang::EbtFloat || typeProxy == glslang::EbtDouble) {8756opCode = spv::Op::OpAtomicFAddEXT;8757if (typeProxy == glslang::EbtFloat16 &&8758(opType.getVectorSize() == 2 || opType.getVectorSize() == 4)) {8759builder.addExtension(spv::E_SPV_NV_shader_atomic_fp16_vector);8760builder.addCapability(spv::Capability::AtomicFloat16VectorNV);8761} else {8762builder.addExtension(spv::E_SPV_EXT_shader_atomic_float_add);8763if (typeProxy == glslang::EbtFloat16) {8764builder.addExtension(spv::E_SPV_EXT_shader_atomic_float16_add);8765builder.addCapability(spv::Capability::AtomicFloat16AddEXT);8766} else if (typeProxy == glslang::EbtFloat) {8767builder.addCapability(spv::Capability::AtomicFloat32AddEXT);8768} else {8769builder.addCapability(spv::Capability::AtomicFloat64AddEXT);8770}8771}8772}8773break;8774case glslang::EOpAtomicSubtract:8775case glslang::EOpAtomicCounterSubtract:8776opCode = spv::Op::OpAtomicISub;8777break;8778case glslang::EOpAtomicMin:8779case glslang::EOpImageAtomicMin:8780case glslang::EOpAtomicCounterMin:8781if (typeProxy == glslang::EbtFloat16 || typeProxy == glslang::EbtFloat || typeProxy == glslang::EbtDouble) {8782opCode = spv::Op::OpAtomicFMinEXT;8783if (typeProxy == glslang::EbtFloat16 &&8784(opType.getVectorSize() == 2 || opType.getVectorSize() == 4)) 
{8785builder.addExtension(spv::E_SPV_NV_shader_atomic_fp16_vector);8786builder.addCapability(spv::Capability::AtomicFloat16VectorNV);8787} else {8788builder.addExtension(spv::E_SPV_EXT_shader_atomic_float_min_max);8789if (typeProxy == glslang::EbtFloat16)8790builder.addCapability(spv::Capability::AtomicFloat16MinMaxEXT);8791else if (typeProxy == glslang::EbtFloat)8792builder.addCapability(spv::Capability::AtomicFloat32MinMaxEXT);8793else8794builder.addCapability(spv::Capability::AtomicFloat64MinMaxEXT);8795}8796} else if (typeProxy == glslang::EbtUint || typeProxy == glslang::EbtUint64) {8797opCode = spv::Op::OpAtomicUMin;8798} else {8799opCode = spv::Op::OpAtomicSMin;8800}8801break;8802case glslang::EOpAtomicMax:8803case glslang::EOpImageAtomicMax:8804case glslang::EOpAtomicCounterMax:8805if (typeProxy == glslang::EbtFloat16 || typeProxy == glslang::EbtFloat || typeProxy == glslang::EbtDouble) {8806opCode = spv::Op::OpAtomicFMaxEXT;8807if (typeProxy == glslang::EbtFloat16 &&8808(opType.getVectorSize() == 2 || opType.getVectorSize() == 4)) {8809builder.addExtension(spv::E_SPV_NV_shader_atomic_fp16_vector);8810builder.addCapability(spv::Capability::AtomicFloat16VectorNV);8811} else {8812builder.addExtension(spv::E_SPV_EXT_shader_atomic_float_min_max);8813if (typeProxy == glslang::EbtFloat16)8814builder.addCapability(spv::Capability::AtomicFloat16MinMaxEXT);8815else if (typeProxy == glslang::EbtFloat)8816builder.addCapability(spv::Capability::AtomicFloat32MinMaxEXT);8817else8818builder.addCapability(spv::Capability::AtomicFloat64MinMaxEXT);8819}8820} else if (typeProxy == glslang::EbtUint || typeProxy == glslang::EbtUint64) {8821opCode = spv::Op::OpAtomicUMax;8822} else {8823opCode = spv::Op::OpAtomicSMax;8824}8825break;8826case glslang::EOpAtomicAnd:8827case glslang::EOpImageAtomicAnd:8828case glslang::EOpAtomicCounterAnd:8829opCode = spv::Op::OpAtomicAnd;8830break;8831case glslang::EOpAtomicOr:8832case glslang::EOpImageAtomicOr:8833case 
glslang::EOpAtomicCounterOr:8834opCode = spv::Op::OpAtomicOr;8835break;8836case glslang::EOpAtomicXor:8837case glslang::EOpImageAtomicXor:8838case glslang::EOpAtomicCounterXor:8839opCode = spv::Op::OpAtomicXor;8840break;8841case glslang::EOpAtomicExchange:8842case glslang::EOpImageAtomicExchange:8843case glslang::EOpAtomicCounterExchange:8844if ((typeProxy == glslang::EbtFloat16) &&8845(opType.getVectorSize() == 2 || opType.getVectorSize() == 4)) {8846builder.addExtension(spv::E_SPV_NV_shader_atomic_fp16_vector);8847builder.addCapability(spv::Capability::AtomicFloat16VectorNV);8848}88498850opCode = spv::Op::OpAtomicExchange;8851break;8852case glslang::EOpAtomicCompSwap:8853case glslang::EOpImageAtomicCompSwap:8854case glslang::EOpAtomicCounterCompSwap:8855opCode = spv::Op::OpAtomicCompareExchange;8856break;8857case glslang::EOpAtomicCounterIncrement:8858opCode = spv::Op::OpAtomicIIncrement;8859break;8860case glslang::EOpAtomicCounterDecrement:8861opCode = spv::Op::OpAtomicIDecrement;8862break;8863case glslang::EOpAtomicCounter:8864case glslang::EOpImageAtomicLoad:8865case glslang::EOpAtomicLoad:8866opCode = spv::Op::OpAtomicLoad;8867break;8868case glslang::EOpAtomicStore:8869case glslang::EOpImageAtomicStore:8870opCode = spv::Op::OpAtomicStore;8871break;8872default:8873assert(0);8874break;8875}88768877if (typeProxy == glslang::EbtInt64 || typeProxy == glslang::EbtUint64)8878builder.addCapability(spv::Capability::Int64Atomics);88798880// Sort out the operands8881// - mapping from glslang -> SPV8882// - there are extra SPV operands that are optional in glslang8883// - compare-exchange swaps the value and comparator8884// - compare-exchange has an extra memory semantics8885// - EOpAtomicCounterDecrement needs a post decrement8886spv::Id pointerId = 0, compareId = 0, valueId = 0;8887// scope defaults to Device in the old model, QueueFamilyKHR in the new model8888spv::Id scopeId;8889if (glslangIntermediate->usingVulkanMemoryModel()) {8890scopeId = 
builder.makeUintConstant(spv::Scope::QueueFamilyKHR);8891} else {8892scopeId = builder.makeUintConstant(spv::Scope::Device);8893}8894// semantics default to relaxed8895spv::Id semanticsId = builder.makeUintConstant(lvalueCoherentFlags.isVolatile() &&8896glslangIntermediate->usingVulkanMemoryModel() ?8897spv::MemorySemanticsMask::Volatile :8898spv::MemorySemanticsMask::MaskNone);8899spv::Id semanticsId2 = semanticsId;89008901pointerId = operands[0];8902if (opCode == spv::Op::OpAtomicIIncrement || opCode == spv::Op::OpAtomicIDecrement) {8903// no additional operands8904} else if (opCode == spv::Op::OpAtomicCompareExchange) {8905compareId = operands[1];8906valueId = operands[2];8907if (operands.size() > 3) {8908scopeId = operands[3];8909semanticsId = builder.makeUintConstant(8910builder.getConstantScalar(operands[4]) | builder.getConstantScalar(operands[5]));8911semanticsId2 = builder.makeUintConstant(8912builder.getConstantScalar(operands[6]) | builder.getConstantScalar(operands[7]));8913}8914} else if (opCode == spv::Op::OpAtomicLoad) {8915if (operands.size() > 1) {8916scopeId = operands[1];8917semanticsId = builder.makeUintConstant(8918builder.getConstantScalar(operands[2]) | builder.getConstantScalar(operands[3]));8919}8920} else {8921// atomic store or RMW8922valueId = operands[1];8923if (operands.size() > 2) {8924scopeId = operands[2];8925semanticsId = builder.makeUintConstant8926(builder.getConstantScalar(operands[3]) | builder.getConstantScalar(operands[4]));8927}8928}89298930// Check for capabilities8931auto const semanticsImmediate = (spv::MemorySemanticsMask)(builder.getConstantScalar(semanticsId) | builder.getConstantScalar(semanticsId2));8932if (anySet(semanticsImmediate, spv::MemorySemanticsMask::MakeAvailableKHR |8933spv::MemorySemanticsMask::MakeVisibleKHR |8934spv::MemorySemanticsMask::OutputMemoryKHR |8935spv::MemorySemanticsMask::Volatile)) {8936builder.addCapability(spv::Capability::VulkanMemoryModelKHR);8937}89388939auto const scope = 
(spv::Scope)builder.getConstantScalar(scopeId);8940if (scope == spv::Scope::QueueFamily) {8941builder.addCapability(spv::Capability::VulkanMemoryModelKHR);8942}89438944if (glslangIntermediate->usingVulkanMemoryModel() && scope == spv::Scope::Device) {8945builder.addCapability(spv::Capability::VulkanMemoryModelDeviceScopeKHR);8946}89478948std::vector<spv::Id> spvAtomicOperands; // hold the spv operands8949spvAtomicOperands.reserve(6);8950spvAtomicOperands.push_back(pointerId);8951spvAtomicOperands.push_back(scopeId);8952spvAtomicOperands.push_back(semanticsId);8953if (opCode == spv::Op::OpAtomicCompareExchange) {8954spvAtomicOperands.push_back(semanticsId2);8955spvAtomicOperands.push_back(valueId);8956spvAtomicOperands.push_back(compareId);8957} else if (opCode != spv::Op::OpAtomicLoad && opCode != spv::Op::OpAtomicIIncrement && opCode != spv::Op::OpAtomicIDecrement) {8958spvAtomicOperands.push_back(valueId);8959}89608961if (opCode == spv::Op::OpAtomicStore) {8962builder.createNoResultOp(opCode, spvAtomicOperands);8963return 0;8964} else {8965spv::Id resultId = builder.createOp(opCode, typeId, spvAtomicOperands);89668967// GLSL and HLSL atomic-counter decrement return post-decrement value,8968// while SPIR-V returns pre-decrement value. 
Translate between these semantics.8969if (op == glslang::EOpAtomicCounterDecrement)8970resultId = builder.createBinOp(spv::Op::OpISub, typeId, resultId, builder.makeIntConstant(1));89718972return resultId;8973}8974}89758976// Create group invocation operations.8977spv::Id TGlslangToSpvTraverser::createInvocationsOperation(glslang::TOperator op, spv::Id typeId,8978std::vector<spv::Id>& operands, glslang::TBasicType typeProxy)8979{8980bool isUnsigned = isTypeUnsignedInt(typeProxy);8981bool isFloat = isTypeFloat(typeProxy);89828983spv::Op opCode = spv::Op::OpNop;8984std::vector<spv::IdImmediate> spvGroupOperands;8985spv::GroupOperation groupOperation = spv::GroupOperation::Max;89868987if (op == glslang::EOpBallot || op == glslang::EOpReadFirstInvocation ||8988op == glslang::EOpReadInvocation) {8989builder.addExtension(spv::E_SPV_KHR_shader_ballot);8990builder.addCapability(spv::Capability::SubgroupBallotKHR);8991} else if (op == glslang::EOpAnyInvocation ||8992op == glslang::EOpAllInvocations ||8993op == glslang::EOpAllInvocationsEqual) {8994builder.addExtension(spv::E_SPV_KHR_subgroup_vote);8995builder.addCapability(spv::Capability::SubgroupVoteKHR);8996} else {8997builder.addCapability(spv::Capability::Groups);8998if (op == glslang::EOpMinInvocationsNonUniform ||8999op == glslang::EOpMaxInvocationsNonUniform ||9000op == glslang::EOpAddInvocationsNonUniform ||9001op == glslang::EOpMinInvocationsInclusiveScanNonUniform ||9002op == glslang::EOpMaxInvocationsInclusiveScanNonUniform ||9003op == glslang::EOpAddInvocationsInclusiveScanNonUniform ||9004op == glslang::EOpMinInvocationsExclusiveScanNonUniform ||9005op == glslang::EOpMaxInvocationsExclusiveScanNonUniform ||9006op == glslang::EOpAddInvocationsExclusiveScanNonUniform)9007builder.addExtension(spv::E_SPV_AMD_shader_ballot);90089009switch (op) {9010case glslang::EOpMinInvocations:9011case glslang::EOpMaxInvocations:9012case glslang::EOpAddInvocations:9013case glslang::EOpMinInvocationsNonUniform:9014case 
glslang::EOpMaxInvocationsNonUniform:9015case glslang::EOpAddInvocationsNonUniform:9016groupOperation = spv::GroupOperation::Reduce;9017break;9018case glslang::EOpMinInvocationsInclusiveScan:9019case glslang::EOpMaxInvocationsInclusiveScan:9020case glslang::EOpAddInvocationsInclusiveScan:9021case glslang::EOpMinInvocationsInclusiveScanNonUniform:9022case glslang::EOpMaxInvocationsInclusiveScanNonUniform:9023case glslang::EOpAddInvocationsInclusiveScanNonUniform:9024groupOperation = spv::GroupOperation::InclusiveScan;9025break;9026case glslang::EOpMinInvocationsExclusiveScan:9027case glslang::EOpMaxInvocationsExclusiveScan:9028case glslang::EOpAddInvocationsExclusiveScan:9029case glslang::EOpMinInvocationsExclusiveScanNonUniform:9030case glslang::EOpMaxInvocationsExclusiveScanNonUniform:9031case glslang::EOpAddInvocationsExclusiveScanNonUniform:9032groupOperation = spv::GroupOperation::ExclusiveScan;9033break;9034default:9035break;9036}9037spv::IdImmediate scope = { true, builder.makeUintConstant(spv::Scope::Subgroup) };9038spvGroupOperands.push_back(scope);9039if (groupOperation != spv::GroupOperation::Max) {9040spv::IdImmediate groupOp = { false, (unsigned)groupOperation };9041spvGroupOperands.push_back(groupOp);9042}9043}90449045for (auto opIt = operands.begin(); opIt != operands.end(); ++opIt) {9046spv::IdImmediate op = { true, *opIt };9047spvGroupOperands.push_back(op);9048}90499050switch (op) {9051case glslang::EOpAnyInvocation:9052opCode = spv::Op::OpSubgroupAnyKHR;9053break;9054case glslang::EOpAllInvocations:9055opCode = spv::Op::OpSubgroupAllKHR;9056break;9057case glslang::EOpAllInvocationsEqual:9058opCode = spv::Op::OpSubgroupAllEqualKHR;9059break;9060case glslang::EOpReadInvocation:9061opCode = spv::Op::OpSubgroupReadInvocationKHR;9062if (builder.isVectorType(typeId))9063return CreateInvocationsVectorOperation(opCode, groupOperation, typeId, operands);9064break;9065case glslang::EOpReadFirstInvocation:9066opCode = 
spv::Op::OpSubgroupFirstInvocationKHR;9067if (builder.isVectorType(typeId))9068return CreateInvocationsVectorOperation(opCode, groupOperation, typeId, operands);9069break;9070case glslang::EOpBallot:9071{9072// NOTE: According to the spec, the result type of "OpSubgroupBallotKHR" must be a 4 component vector of 329073// bit integer types. The GLSL built-in function "ballotARB()" assumes the maximum number of invocations in9074// a subgroup is 64. Thus, we have to convert uvec4.xy to uint64_t as follow:9075//9076// result = Bitcast(SubgroupBallotKHR(Predicate).xy)9077//9078spv::Id uintType = builder.makeUintType(32);9079spv::Id uvec4Type = builder.makeVectorType(uintType, 4);9080spv::Id result = builder.createOp(spv::Op::OpSubgroupBallotKHR, uvec4Type, spvGroupOperands);90819082std::vector<spv::Id> components;9083components.push_back(builder.createCompositeExtract(result, uintType, 0));9084components.push_back(builder.createCompositeExtract(result, uintType, 1));90859086spv::Id uvec2Type = builder.makeVectorType(uintType, 2);9087return builder.createUnaryOp(spv::Op::OpBitcast, typeId,9088builder.createCompositeConstruct(uvec2Type, components));9089}90909091case glslang::EOpMinInvocations:9092case glslang::EOpMaxInvocations:9093case glslang::EOpAddInvocations:9094case glslang::EOpMinInvocationsInclusiveScan:9095case glslang::EOpMaxInvocationsInclusiveScan:9096case glslang::EOpAddInvocationsInclusiveScan:9097case glslang::EOpMinInvocationsExclusiveScan:9098case glslang::EOpMaxInvocationsExclusiveScan:9099case glslang::EOpAddInvocationsExclusiveScan:9100if (op == glslang::EOpMinInvocations ||9101op == glslang::EOpMinInvocationsInclusiveScan ||9102op == glslang::EOpMinInvocationsExclusiveScan) {9103if (isFloat)9104opCode = spv::Op::OpGroupFMin;9105else {9106if (isUnsigned)9107opCode = spv::Op::OpGroupUMin;9108else9109opCode = spv::Op::OpGroupSMin;9110}9111} else if (op == glslang::EOpMaxInvocations ||9112op == glslang::EOpMaxInvocationsInclusiveScan ||9113op == 
glslang::EOpMaxInvocationsExclusiveScan) {9114if (isFloat)9115opCode = spv::Op::OpGroupFMax;9116else {9117if (isUnsigned)9118opCode = spv::Op::OpGroupUMax;9119else9120opCode = spv::Op::OpGroupSMax;9121}9122} else {9123if (isFloat)9124opCode = spv::Op::OpGroupFAdd;9125else9126opCode = spv::Op::OpGroupIAdd;9127}91289129if (builder.isVectorType(typeId))9130return CreateInvocationsVectorOperation(opCode, groupOperation, typeId, operands);91319132break;9133case glslang::EOpMinInvocationsNonUniform:9134case glslang::EOpMaxInvocationsNonUniform:9135case glslang::EOpAddInvocationsNonUniform:9136case glslang::EOpMinInvocationsInclusiveScanNonUniform:9137case glslang::EOpMaxInvocationsInclusiveScanNonUniform:9138case glslang::EOpAddInvocationsInclusiveScanNonUniform:9139case glslang::EOpMinInvocationsExclusiveScanNonUniform:9140case glslang::EOpMaxInvocationsExclusiveScanNonUniform:9141case glslang::EOpAddInvocationsExclusiveScanNonUniform:9142if (op == glslang::EOpMinInvocationsNonUniform ||9143op == glslang::EOpMinInvocationsInclusiveScanNonUniform ||9144op == glslang::EOpMinInvocationsExclusiveScanNonUniform) {9145if (isFloat)9146opCode = spv::Op::OpGroupFMinNonUniformAMD;9147else {9148if (isUnsigned)9149opCode = spv::Op::OpGroupUMinNonUniformAMD;9150else9151opCode = spv::Op::OpGroupSMinNonUniformAMD;9152}9153}9154else if (op == glslang::EOpMaxInvocationsNonUniform ||9155op == glslang::EOpMaxInvocationsInclusiveScanNonUniform ||9156op == glslang::EOpMaxInvocationsExclusiveScanNonUniform) {9157if (isFloat)9158opCode = spv::Op::OpGroupFMaxNonUniformAMD;9159else {9160if (isUnsigned)9161opCode = spv::Op::OpGroupUMaxNonUniformAMD;9162else9163opCode = spv::Op::OpGroupSMaxNonUniformAMD;9164}9165}9166else {9167if (isFloat)9168opCode = spv::Op::OpGroupFAddNonUniformAMD;9169else9170opCode = spv::Op::OpGroupIAddNonUniformAMD;9171}91729173if (builder.isVectorType(typeId))9174return CreateInvocationsVectorOperation(opCode, groupOperation, typeId, 
operands);91759176break;9177default:9178logger->missingFunctionality("invocation operation");9179return spv::NoResult;9180}91819182assert(opCode != spv::Op::OpNop);9183return builder.createOp(opCode, typeId, spvGroupOperands);9184}91859186// Create group invocation operations on a vector9187spv::Id TGlslangToSpvTraverser::CreateInvocationsVectorOperation(spv::Op op, spv::GroupOperation groupOperation,9188spv::Id typeId, std::vector<spv::Id>& operands)9189{9190assert(op == spv::Op::OpGroupFMin || op == spv::Op::OpGroupUMin || op == spv::Op::OpGroupSMin ||9191op == spv::Op::OpGroupFMax || op == spv::Op::OpGroupUMax || op == spv::Op::OpGroupSMax ||9192op == spv::Op::OpGroupFAdd || op == spv::Op::OpGroupIAdd || op == spv::Op::OpGroupBroadcast ||9193op == spv::Op::OpSubgroupReadInvocationKHR || op == spv::Op::OpSubgroupFirstInvocationKHR ||9194op == spv::Op::OpGroupFMinNonUniformAMD || op == spv::Op::OpGroupUMinNonUniformAMD ||9195op == spv::Op::OpGroupSMinNonUniformAMD ||9196op == spv::Op::OpGroupFMaxNonUniformAMD || op == spv::Op::OpGroupUMaxNonUniformAMD ||9197op == spv::Op::OpGroupSMaxNonUniformAMD ||9198op == spv::Op::OpGroupFAddNonUniformAMD || op == spv::Op::OpGroupIAddNonUniformAMD);91999200// Handle group invocation operations scalar by scalar.9201// The result type is the same type as the original type.9202// The algorithm is to:9203// - break the vector into scalars9204// - apply the operation to each scalar9205// - make a vector out the scalar results92069207// get the types sorted out9208int numComponents = builder.getNumComponents(operands[0]);9209spv::Id scalarType = builder.getScalarTypeId(builder.getTypeId(operands[0]));9210std::vector<spv::Id> results;92119212// do each scalar op9213for (int comp = 0; comp < numComponents; ++comp) {9214std::vector<unsigned int> indexes;9215indexes.push_back(comp);9216spv::IdImmediate scalar = { true, builder.createCompositeExtract(operands[0], scalarType, indexes) };9217std::vector<spv::IdImmediate> 
spvGroupOperands;9218if (op == spv::Op::OpSubgroupReadInvocationKHR) {9219spvGroupOperands.push_back(scalar);9220spv::IdImmediate operand = { true, operands[1] };9221spvGroupOperands.push_back(operand);9222} else if (op == spv::Op::OpSubgroupFirstInvocationKHR) {9223spvGroupOperands.push_back(scalar);9224} else if (op == spv::Op::OpGroupBroadcast) {9225spv::IdImmediate scope = { true, builder.makeUintConstant(spv::Scope::Subgroup) };9226spvGroupOperands.push_back(scope);9227spvGroupOperands.push_back(scalar);9228spv::IdImmediate operand = { true, operands[1] };9229spvGroupOperands.push_back(operand);9230} else {9231spv::IdImmediate scope = { true, builder.makeUintConstant(spv::Scope::Subgroup) };9232spvGroupOperands.push_back(scope);9233spv::IdImmediate groupOp = { false, (unsigned)groupOperation };9234spvGroupOperands.push_back(groupOp);9235spvGroupOperands.push_back(scalar);9236}92379238results.push_back(builder.createOp(op, scalarType, spvGroupOperands));9239}92409241// put the pieces together9242return builder.createCompositeConstruct(typeId, results);9243}92449245// Create subgroup invocation operations.9246spv::Id TGlslangToSpvTraverser::createSubgroupOperation(glslang::TOperator op, spv::Id typeId,9247std::vector<spv::Id>& operands, glslang::TBasicType typeProxy)9248{9249// Add the required capabilities.9250switch (op) {9251case glslang::EOpSubgroupElect:9252builder.addCapability(spv::Capability::GroupNonUniform);9253break;9254case glslang::EOpSubgroupQuadAll:9255case glslang::EOpSubgroupQuadAny:9256builder.addExtension(spv::E_SPV_KHR_quad_control);9257builder.addCapability(spv::Capability::QuadControlKHR);9258[[fallthrough]];9259case glslang::EOpSubgroupAll:9260case glslang::EOpSubgroupAny:9261case glslang::EOpSubgroupAllEqual:9262builder.addCapability(spv::Capability::GroupNonUniform);9263builder.addCapability(spv::Capability::GroupNonUniformVote);9264break;9265case glslang::EOpSubgroupBroadcast:9266case glslang::EOpSubgroupBroadcastFirst:9267case 
glslang::EOpSubgroupBallot:9268case glslang::EOpSubgroupInverseBallot:9269case glslang::EOpSubgroupBallotBitExtract:9270case glslang::EOpSubgroupBallotBitCount:9271case glslang::EOpSubgroupBallotInclusiveBitCount:9272case glslang::EOpSubgroupBallotExclusiveBitCount:9273case glslang::EOpSubgroupBallotFindLSB:9274case glslang::EOpSubgroupBallotFindMSB:9275builder.addCapability(spv::Capability::GroupNonUniform);9276builder.addCapability(spv::Capability::GroupNonUniformBallot);9277break;9278case glslang::EOpSubgroupRotate:9279case glslang::EOpSubgroupClusteredRotate:9280builder.addExtension(spv::E_SPV_KHR_subgroup_rotate);9281builder.addCapability(spv::Capability::GroupNonUniformRotateKHR);9282break;9283case glslang::EOpSubgroupShuffle:9284case glslang::EOpSubgroupShuffleXor:9285builder.addCapability(spv::Capability::GroupNonUniform);9286builder.addCapability(spv::Capability::GroupNonUniformShuffle);9287break;9288case glslang::EOpSubgroupShuffleUp:9289case glslang::EOpSubgroupShuffleDown:9290builder.addCapability(spv::Capability::GroupNonUniform);9291builder.addCapability(spv::Capability::GroupNonUniformShuffleRelative);9292break;9293case glslang::EOpSubgroupAdd:9294case glslang::EOpSubgroupMul:9295case glslang::EOpSubgroupMin:9296case glslang::EOpSubgroupMax:9297case glslang::EOpSubgroupAnd:9298case glslang::EOpSubgroupOr:9299case glslang::EOpSubgroupXor:9300case glslang::EOpSubgroupInclusiveAdd:9301case glslang::EOpSubgroupInclusiveMul:9302case glslang::EOpSubgroupInclusiveMin:9303case glslang::EOpSubgroupInclusiveMax:9304case glslang::EOpSubgroupInclusiveAnd:9305case glslang::EOpSubgroupInclusiveOr:9306case glslang::EOpSubgroupInclusiveXor:9307case glslang::EOpSubgroupExclusiveAdd:9308case glslang::EOpSubgroupExclusiveMul:9309case glslang::EOpSubgroupExclusiveMin:9310case glslang::EOpSubgroupExclusiveMax:9311case glslang::EOpSubgroupExclusiveAnd:9312case glslang::EOpSubgroupExclusiveOr:9313case 
glslang::EOpSubgroupExclusiveXor:9314builder.addCapability(spv::Capability::GroupNonUniform);9315builder.addCapability(spv::Capability::GroupNonUniformArithmetic);9316break;9317case glslang::EOpSubgroupClusteredAdd:9318case glslang::EOpSubgroupClusteredMul:9319case glslang::EOpSubgroupClusteredMin:9320case glslang::EOpSubgroupClusteredMax:9321case glslang::EOpSubgroupClusteredAnd:9322case glslang::EOpSubgroupClusteredOr:9323case glslang::EOpSubgroupClusteredXor:9324builder.addCapability(spv::Capability::GroupNonUniform);9325builder.addCapability(spv::Capability::GroupNonUniformClustered);9326break;9327case glslang::EOpSubgroupQuadBroadcast:9328case glslang::EOpSubgroupQuadSwapHorizontal:9329case glslang::EOpSubgroupQuadSwapVertical:9330case glslang::EOpSubgroupQuadSwapDiagonal:9331builder.addCapability(spv::Capability::GroupNonUniform);9332builder.addCapability(spv::Capability::GroupNonUniformQuad);9333break;9334case glslang::EOpSubgroupPartitionedAdd:9335case glslang::EOpSubgroupPartitionedMul:9336case glslang::EOpSubgroupPartitionedMin:9337case glslang::EOpSubgroupPartitionedMax:9338case glslang::EOpSubgroupPartitionedAnd:9339case glslang::EOpSubgroupPartitionedOr:9340case glslang::EOpSubgroupPartitionedXor:9341case glslang::EOpSubgroupPartitionedInclusiveAdd:9342case glslang::EOpSubgroupPartitionedInclusiveMul:9343case glslang::EOpSubgroupPartitionedInclusiveMin:9344case glslang::EOpSubgroupPartitionedInclusiveMax:9345case glslang::EOpSubgroupPartitionedInclusiveAnd:9346case glslang::EOpSubgroupPartitionedInclusiveOr:9347case glslang::EOpSubgroupPartitionedInclusiveXor:9348case glslang::EOpSubgroupPartitionedExclusiveAdd:9349case glslang::EOpSubgroupPartitionedExclusiveMul:9350case glslang::EOpSubgroupPartitionedExclusiveMin:9351case glslang::EOpSubgroupPartitionedExclusiveMax:9352case glslang::EOpSubgroupPartitionedExclusiveAnd:9353case glslang::EOpSubgroupPartitionedExclusiveOr:9354case 
glslang::EOpSubgroupPartitionedExclusiveXor:9355builder.addExtension(spv::E_SPV_NV_shader_subgroup_partitioned);9356builder.addCapability(spv::Capability::GroupNonUniformPartitionedNV);9357break;9358default: assert(0 && "Unhandled subgroup operation!");9359}936093619362const bool isUnsigned = isTypeUnsignedInt(typeProxy);9363const bool isFloat = isTypeFloat(typeProxy);9364const bool isBool = typeProxy == glslang::EbtBool;93659366spv::Op opCode = spv::Op::OpNop;93679368// Figure out which opcode to use.9369switch (op) {9370case glslang::EOpSubgroupElect: opCode = spv::Op::OpGroupNonUniformElect; break;9371case glslang::EOpSubgroupQuadAll: opCode = spv::Op::OpGroupNonUniformQuadAllKHR; break;9372case glslang::EOpSubgroupAll: opCode = spv::Op::OpGroupNonUniformAll; break;9373case glslang::EOpSubgroupQuadAny: opCode = spv::Op::OpGroupNonUniformQuadAnyKHR; break;9374case glslang::EOpSubgroupAny: opCode = spv::Op::OpGroupNonUniformAny; break;9375case glslang::EOpSubgroupAllEqual: opCode = spv::Op::OpGroupNonUniformAllEqual; break;9376case glslang::EOpSubgroupBroadcast: opCode = spv::Op::OpGroupNonUniformBroadcast; break;9377case glslang::EOpSubgroupBroadcastFirst: opCode = spv::Op::OpGroupNonUniformBroadcastFirst; break;9378case glslang::EOpSubgroupBallot: opCode = spv::Op::OpGroupNonUniformBallot; break;9379case glslang::EOpSubgroupInverseBallot: opCode = spv::Op::OpGroupNonUniformInverseBallot; break;9380case glslang::EOpSubgroupBallotBitExtract: opCode = spv::Op::OpGroupNonUniformBallotBitExtract; break;9381case glslang::EOpSubgroupBallotBitCount:9382case glslang::EOpSubgroupBallotInclusiveBitCount:9383case glslang::EOpSubgroupBallotExclusiveBitCount: opCode = spv::Op::OpGroupNonUniformBallotBitCount; break;9384case glslang::EOpSubgroupBallotFindLSB: opCode = spv::Op::OpGroupNonUniformBallotFindLSB; break;9385case glslang::EOpSubgroupBallotFindMSB: opCode = spv::Op::OpGroupNonUniformBallotFindMSB; break;9386case glslang::EOpSubgroupShuffle: opCode = 
spv::Op::OpGroupNonUniformShuffle; break;9387case glslang::EOpSubgroupShuffleXor: opCode = spv::Op::OpGroupNonUniformShuffleXor; break;9388case glslang::EOpSubgroupShuffleUp: opCode = spv::Op::OpGroupNonUniformShuffleUp; break;9389case glslang::EOpSubgroupShuffleDown: opCode = spv::Op::OpGroupNonUniformShuffleDown; break;9390case glslang::EOpSubgroupRotate:9391case glslang::EOpSubgroupClusteredRotate: opCode = spv::Op::OpGroupNonUniformRotateKHR; break;9392case glslang::EOpSubgroupAdd:9393case glslang::EOpSubgroupInclusiveAdd:9394case glslang::EOpSubgroupExclusiveAdd:9395case glslang::EOpSubgroupClusteredAdd:9396case glslang::EOpSubgroupPartitionedAdd:9397case glslang::EOpSubgroupPartitionedInclusiveAdd:9398case glslang::EOpSubgroupPartitionedExclusiveAdd:9399if (isFloat) {9400opCode = spv::Op::OpGroupNonUniformFAdd;9401} else {9402opCode = spv::Op::OpGroupNonUniformIAdd;9403}9404break;9405case glslang::EOpSubgroupMul:9406case glslang::EOpSubgroupInclusiveMul:9407case glslang::EOpSubgroupExclusiveMul:9408case glslang::EOpSubgroupClusteredMul:9409case glslang::EOpSubgroupPartitionedMul:9410case glslang::EOpSubgroupPartitionedInclusiveMul:9411case glslang::EOpSubgroupPartitionedExclusiveMul:9412if (isFloat) {9413opCode = spv::Op::OpGroupNonUniformFMul;9414} else {9415opCode = spv::Op::OpGroupNonUniformIMul;9416}9417break;9418case glslang::EOpSubgroupMin:9419case glslang::EOpSubgroupInclusiveMin:9420case glslang::EOpSubgroupExclusiveMin:9421case glslang::EOpSubgroupClusteredMin:9422case glslang::EOpSubgroupPartitionedMin:9423case glslang::EOpSubgroupPartitionedInclusiveMin:9424case glslang::EOpSubgroupPartitionedExclusiveMin:9425if (isFloat) {9426opCode = spv::Op::OpGroupNonUniformFMin;9427} else if (isUnsigned) {9428opCode = spv::Op::OpGroupNonUniformUMin;9429} else {9430opCode = spv::Op::OpGroupNonUniformSMin;9431}9432break;9433case glslang::EOpSubgroupMax:9434case glslang::EOpSubgroupInclusiveMax:9435case glslang::EOpSubgroupExclusiveMax:9436case 
glslang::EOpSubgroupClusteredMax:9437case glslang::EOpSubgroupPartitionedMax:9438case glslang::EOpSubgroupPartitionedInclusiveMax:9439case glslang::EOpSubgroupPartitionedExclusiveMax:9440if (isFloat) {9441opCode = spv::Op::OpGroupNonUniformFMax;9442} else if (isUnsigned) {9443opCode = spv::Op::OpGroupNonUniformUMax;9444} else {9445opCode = spv::Op::OpGroupNonUniformSMax;9446}9447break;9448case glslang::EOpSubgroupAnd:9449case glslang::EOpSubgroupInclusiveAnd:9450case glslang::EOpSubgroupExclusiveAnd:9451case glslang::EOpSubgroupClusteredAnd:9452case glslang::EOpSubgroupPartitionedAnd:9453case glslang::EOpSubgroupPartitionedInclusiveAnd:9454case glslang::EOpSubgroupPartitionedExclusiveAnd:9455if (isBool) {9456opCode = spv::Op::OpGroupNonUniformLogicalAnd;9457} else {9458opCode = spv::Op::OpGroupNonUniformBitwiseAnd;9459}9460break;9461case glslang::EOpSubgroupOr:9462case glslang::EOpSubgroupInclusiveOr:9463case glslang::EOpSubgroupExclusiveOr:9464case glslang::EOpSubgroupClusteredOr:9465case glslang::EOpSubgroupPartitionedOr:9466case glslang::EOpSubgroupPartitionedInclusiveOr:9467case glslang::EOpSubgroupPartitionedExclusiveOr:9468if (isBool) {9469opCode = spv::Op::OpGroupNonUniformLogicalOr;9470} else {9471opCode = spv::Op::OpGroupNonUniformBitwiseOr;9472}9473break;9474case glslang::EOpSubgroupXor:9475case glslang::EOpSubgroupInclusiveXor:9476case glslang::EOpSubgroupExclusiveXor:9477case glslang::EOpSubgroupClusteredXor:9478case glslang::EOpSubgroupPartitionedXor:9479case glslang::EOpSubgroupPartitionedInclusiveXor:9480case glslang::EOpSubgroupPartitionedExclusiveXor:9481if (isBool) {9482opCode = spv::Op::OpGroupNonUniformLogicalXor;9483} else {9484opCode = spv::Op::OpGroupNonUniformBitwiseXor;9485}9486break;9487case glslang::EOpSubgroupQuadBroadcast: opCode = spv::Op::OpGroupNonUniformQuadBroadcast; break;9488case glslang::EOpSubgroupQuadSwapHorizontal:9489case glslang::EOpSubgroupQuadSwapVertical:9490case glslang::EOpSubgroupQuadSwapDiagonal: opCode = 
spv::Op::OpGroupNonUniformQuadSwap; break;9491default: assert(0 && "Unhandled subgroup operation!");9492}94939494// get the right Group Operation9495spv::GroupOperation groupOperation = spv::GroupOperation::Max;9496switch (op) {9497default:9498break;9499case glslang::EOpSubgroupBallotBitCount:9500case glslang::EOpSubgroupAdd:9501case glslang::EOpSubgroupMul:9502case glslang::EOpSubgroupMin:9503case glslang::EOpSubgroupMax:9504case glslang::EOpSubgroupAnd:9505case glslang::EOpSubgroupOr:9506case glslang::EOpSubgroupXor:9507groupOperation = spv::GroupOperation::Reduce;9508break;9509case glslang::EOpSubgroupBallotInclusiveBitCount:9510case glslang::EOpSubgroupInclusiveAdd:9511case glslang::EOpSubgroupInclusiveMul:9512case glslang::EOpSubgroupInclusiveMin:9513case glslang::EOpSubgroupInclusiveMax:9514case glslang::EOpSubgroupInclusiveAnd:9515case glslang::EOpSubgroupInclusiveOr:9516case glslang::EOpSubgroupInclusiveXor:9517groupOperation = spv::GroupOperation::InclusiveScan;9518break;9519case glslang::EOpSubgroupBallotExclusiveBitCount:9520case glslang::EOpSubgroupExclusiveAdd:9521case glslang::EOpSubgroupExclusiveMul:9522case glslang::EOpSubgroupExclusiveMin:9523case glslang::EOpSubgroupExclusiveMax:9524case glslang::EOpSubgroupExclusiveAnd:9525case glslang::EOpSubgroupExclusiveOr:9526case glslang::EOpSubgroupExclusiveXor:9527groupOperation = spv::GroupOperation::ExclusiveScan;9528break;9529case glslang::EOpSubgroupClusteredAdd:9530case glslang::EOpSubgroupClusteredMul:9531case glslang::EOpSubgroupClusteredMin:9532case glslang::EOpSubgroupClusteredMax:9533case glslang::EOpSubgroupClusteredAnd:9534case glslang::EOpSubgroupClusteredOr:9535case glslang::EOpSubgroupClusteredXor:9536groupOperation = spv::GroupOperation::ClusteredReduce;9537break;9538case glslang::EOpSubgroupPartitionedAdd:9539case glslang::EOpSubgroupPartitionedMul:9540case glslang::EOpSubgroupPartitionedMin:9541case glslang::EOpSubgroupPartitionedMax:9542case glslang::EOpSubgroupPartitionedAnd:9543case 
glslang::EOpSubgroupPartitionedOr:9544case glslang::EOpSubgroupPartitionedXor:9545groupOperation = spv::GroupOperation::PartitionedReduceNV;9546break;9547case glslang::EOpSubgroupPartitionedInclusiveAdd:9548case glslang::EOpSubgroupPartitionedInclusiveMul:9549case glslang::EOpSubgroupPartitionedInclusiveMin:9550case glslang::EOpSubgroupPartitionedInclusiveMax:9551case glslang::EOpSubgroupPartitionedInclusiveAnd:9552case glslang::EOpSubgroupPartitionedInclusiveOr:9553case glslang::EOpSubgroupPartitionedInclusiveXor:9554groupOperation = spv::GroupOperation::PartitionedInclusiveScanNV;9555break;9556case glslang::EOpSubgroupPartitionedExclusiveAdd:9557case glslang::EOpSubgroupPartitionedExclusiveMul:9558case glslang::EOpSubgroupPartitionedExclusiveMin:9559case glslang::EOpSubgroupPartitionedExclusiveMax:9560case glslang::EOpSubgroupPartitionedExclusiveAnd:9561case glslang::EOpSubgroupPartitionedExclusiveOr:9562case glslang::EOpSubgroupPartitionedExclusiveXor:9563groupOperation = spv::GroupOperation::PartitionedExclusiveScanNV;9564break;9565}95669567// build the instruction9568std::vector<spv::IdImmediate> spvGroupOperands;95699570// Every operation begins with the Execution Scope operand.9571spv::IdImmediate executionScope = { true, builder.makeUintConstant(spv::Scope::Subgroup) };9572// All other ops need the execution scope. 
Quad Control Ops don't need scope, it's always Quad.9573if (opCode != spv::Op::OpGroupNonUniformQuadAllKHR && opCode != spv::Op::OpGroupNonUniformQuadAnyKHR) {9574spvGroupOperands.push_back(executionScope);9575}95769577// Next, for all operations that use a Group Operation, push that as an operand.9578if (groupOperation != spv::GroupOperation::Max) {9579spv::IdImmediate groupOperand = { false, (unsigned)groupOperation };9580spvGroupOperands.push_back(groupOperand);9581}95829583// Push back the operands next.9584for (auto opIt = operands.cbegin(); opIt != operands.cend(); ++opIt) {9585spv::IdImmediate operand = { true, *opIt };9586spvGroupOperands.push_back(operand);9587}95889589// Some opcodes have additional operands.9590spv::Id directionId = spv::NoResult;9591switch (op) {9592default: break;9593case glslang::EOpSubgroupQuadSwapHorizontal: directionId = builder.makeUintConstant(0); break;9594case glslang::EOpSubgroupQuadSwapVertical: directionId = builder.makeUintConstant(1); break;9595case glslang::EOpSubgroupQuadSwapDiagonal: directionId = builder.makeUintConstant(2); break;9596}9597if (directionId != spv::NoResult) {9598spv::IdImmediate direction = { true, directionId };9599spvGroupOperands.push_back(direction);9600}96019602return builder.createOp(opCode, typeId, spvGroupOperands);9603}96049605spv::Id TGlslangToSpvTraverser::createMiscOperation(glslang::TOperator op, spv::Decoration precision,9606spv::Id typeId, std::vector<spv::Id>& operands, glslang::TBasicType typeProxy)9607{9608bool isUnsigned = isTypeUnsignedInt(typeProxy);9609bool isFloat = isTypeFloat(typeProxy);96109611spv::Op opCode = spv::Op::OpNop;9612int extBuiltins = -1;9613int libCall = -1;9614size_t consumedOperands = operands.size();9615spv::Id typeId0 = 0;9616if (consumedOperands > 0)9617typeId0 = builder.getTypeId(operands[0]);9618spv::Id typeId1 = 0;9619if (consumedOperands > 1)9620typeId1 = builder.getTypeId(operands[1]);9621spv::Id frexpIntType = 0;96229623switch (op) {9624case 
glslang::EOpMin:9625if (isFloat)9626libCall = nanMinMaxClamp ? spv::GLSLstd450NMin : spv::GLSLstd450FMin;9627else if (isUnsigned)9628libCall = spv::GLSLstd450UMin;9629else9630libCall = spv::GLSLstd450SMin;9631builder.promoteScalar(precision, operands.front(), operands.back());9632break;9633case glslang::EOpModf:9634{9635libCall = spv::GLSLstd450ModfStruct;9636assert(builder.isFloatType(builder.getScalarTypeId(typeId0)));9637// The returned struct has two members of the same type as the first argument9638typeId = builder.makeStructResultType(typeId0, typeId0);9639consumedOperands = 1;9640}9641break;9642case glslang::EOpMax:9643if (isFloat)9644libCall = nanMinMaxClamp ? spv::GLSLstd450NMax : spv::GLSLstd450FMax;9645else if (isUnsigned)9646libCall = spv::GLSLstd450UMax;9647else9648libCall = spv::GLSLstd450SMax;9649builder.promoteScalar(precision, operands.front(), operands.back());9650break;9651case glslang::EOpPow:9652libCall = spv::GLSLstd450Pow;9653break;9654case glslang::EOpDot:9655case glslang::EOpDotPackedEXT:9656case glslang::EOpDotAccSatEXT:9657case glslang::EOpDotPackedAccSatEXT:9658{9659if (builder.isFloatType(builder.getScalarTypeId(typeId0)) ||9660// HLSL supports dot(int,int) which is just a multiply9661glslangIntermediate->getSource() == glslang::EShSourceHlsl) {9662if (typeProxy == glslang::EbtBFloat16) {9663builder.addExtension(spv::E_SPV_KHR_bfloat16);9664builder.addCapability(spv::Capability::BFloat16DotProductKHR);9665}9666opCode = spv::Op::OpDot;9667} else {9668builder.addExtension(spv::E_SPV_KHR_integer_dot_product);9669builder.addCapability(spv::Capability::DotProductKHR);9670const unsigned int vectorSize = builder.getNumComponents(operands[0]);9671if (op == glslang::EOpDotPackedEXT || op == glslang::EOpDotPackedAccSatEXT) {9672builder.addCapability(spv::Capability::DotProductInput4x8BitPackedKHR);9673} else if (vectorSize == 4 && builder.getScalarTypeWidth(typeId0) == 8) {9674builder.addCapability(spv::Capability::DotProductInput4x8BitKHR);9675} 
else {9676builder.addCapability(spv::Capability::DotProductInputAllKHR);9677}9678const bool type0isSigned = builder.isIntType(builder.getScalarTypeId(typeId0));9679const bool type1isSigned = builder.isIntType(builder.getScalarTypeId(typeId1));9680const bool accSat = (op == glslang::EOpDotAccSatEXT || op == glslang::EOpDotPackedAccSatEXT);9681if (!type0isSigned && !type1isSigned) {9682opCode = accSat ? spv::Op::OpUDotAccSatKHR : spv::Op::OpUDotKHR;9683} else if (type0isSigned && type1isSigned) {9684opCode = accSat ? spv::Op::OpSDotAccSatKHR : spv::Op::OpSDotKHR;9685} else {9686opCode = accSat ? spv::Op::OpSUDotAccSatKHR : spv::Op::OpSUDotKHR;9687// the spir-v opcode assumes the operands to be "signed, unsigned" in that order, so swap if needed9688if (type1isSigned) {9689std::swap(operands[0], operands[1]);9690}9691}9692std::vector<spv::IdImmediate> operands2;9693for (auto &o : operands) {9694operands2.push_back({true, o});9695}9696if (op == glslang::EOpDotPackedEXT || op == glslang::EOpDotPackedAccSatEXT) {9697operands2.push_back({false, 0});9698}9699return builder.createOp(opCode, typeId, operands2);9700}9701}9702break;9703case glslang::EOpAtan:9704libCall = spv::GLSLstd450Atan2;9705break;97069707case glslang::EOpClamp:9708if (isFloat)9709libCall = nanMinMaxClamp ? spv::GLSLstd450NClamp : spv::GLSLstd450FClamp;9710else if (isUnsigned)9711libCall = spv::GLSLstd450UClamp;9712else9713libCall = spv::GLSLstd450SClamp;9714builder.promoteScalar(precision, operands.front(), operands[1]);9715builder.promoteScalar(precision, operands.front(), operands[2]);9716break;9717case glslang::EOpMix:9718if (! 
builder.isBoolType(builder.getScalarTypeId(builder.getTypeId(operands.back())))) {9719assert(isFloat);9720libCall = spv::GLSLstd450FMix;9721} else {9722opCode = spv::Op::OpSelect;9723std::swap(operands.front(), operands.back());9724}9725builder.promoteScalar(precision, operands.front(), operands.back());9726break;9727case glslang::EOpStep:9728libCall = spv::GLSLstd450Step;9729builder.promoteScalar(precision, operands.front(), operands.back());9730break;9731case glslang::EOpSmoothStep:9732libCall = spv::GLSLstd450SmoothStep;9733builder.promoteScalar(precision, operands[0], operands[2]);9734builder.promoteScalar(precision, operands[1], operands[2]);9735break;97369737case glslang::EOpDistance:9738libCall = spv::GLSLstd450Distance;9739break;9740case glslang::EOpCross:9741libCall = spv::GLSLstd450Cross;9742break;9743case glslang::EOpFaceForward:9744libCall = spv::GLSLstd450FaceForward;9745break;9746case glslang::EOpReflect:9747libCall = spv::GLSLstd450Reflect;9748break;9749case glslang::EOpRefract:9750libCall = spv::GLSLstd450Refract;9751break;9752case glslang::EOpBarrier:9753{9754// This is for the extended controlBarrier function, with four operands.9755// The unextended barrier() goes through createNoArgOperation.9756assert(operands.size() == 4);9757auto const executionScope = (spv::Scope)builder.getConstantScalar(operands[0]);9758auto const memoryScope = (spv::Scope)builder.getConstantScalar(operands[1]);9759auto const semantics = (spv::MemorySemanticsMask)(builder.getConstantScalar(operands[2]) | builder.getConstantScalar(operands[3]));9760builder.createControlBarrier(executionScope, memoryScope,9761semantics);9762if (anySet(semantics, spv::MemorySemanticsMask::MakeAvailableKHR |9763spv::MemorySemanticsMask::MakeVisibleKHR |9764spv::MemorySemanticsMask::OutputMemoryKHR |9765spv::MemorySemanticsMask::Volatile)) {9766builder.addCapability(spv::Capability::VulkanMemoryModelKHR);9767}9768if (glslangIntermediate->usingVulkanMemoryModel() && (executionScope == 
spv::Scope::Device ||9769memoryScope == spv::Scope::Device)) {9770builder.addCapability(spv::Capability::VulkanMemoryModelDeviceScopeKHR);9771}9772return 0;9773}9774break;9775case glslang::EOpMemoryBarrier:9776{9777// This is for the extended memoryBarrier function, with three operands.9778// The unextended memoryBarrier() goes through createNoArgOperation.9779assert(operands.size() == 3);9780auto const memoryScope = (spv::Scope)builder.getConstantScalar(operands[0]);9781auto const semantics = (spv::MemorySemanticsMask)(builder.getConstantScalar(operands[1]) | builder.getConstantScalar(operands[2]));9782builder.createMemoryBarrier(memoryScope, semantics);9783if (anySet(semantics, spv::MemorySemanticsMask::MakeAvailableKHR |9784spv::MemorySemanticsMask::MakeVisibleKHR |9785spv::MemorySemanticsMask::OutputMemoryKHR |9786spv::MemorySemanticsMask::Volatile)) {9787builder.addCapability(spv::Capability::VulkanMemoryModelKHR);9788}9789if (glslangIntermediate->usingVulkanMemoryModel() && memoryScope == spv::Scope::Device) {9790builder.addCapability(spv::Capability::VulkanMemoryModelDeviceScopeKHR);9791}9792return 0;9793}9794break;97959796case glslang::EOpInterpolateAtSample:9797if (typeProxy == glslang::EbtFloat16)9798builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float);9799libCall = spv::GLSLstd450InterpolateAtSample;9800break;9801case glslang::EOpInterpolateAtOffset:9802if (typeProxy == glslang::EbtFloat16)9803builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float);9804libCall = spv::GLSLstd450InterpolateAtOffset;9805break;9806case glslang::EOpAddCarry:9807opCode = spv::Op::OpIAddCarry;9808typeId = builder.makeStructResultType(typeId0, typeId0);9809consumedOperands = 2;9810break;9811case glslang::EOpSubBorrow:9812opCode = spv::Op::OpISubBorrow;9813typeId = builder.makeStructResultType(typeId0, typeId0);9814consumedOperands = 2;9815break;9816case glslang::EOpUMulExtended:9817opCode = spv::Op::OpUMulExtended;9818typeId = builder.makeStructResultType(typeId0, 
typeId0);9819consumedOperands = 2;9820break;9821case glslang::EOpIMulExtended:9822opCode = spv::Op::OpSMulExtended;9823typeId = builder.makeStructResultType(typeId0, typeId0);9824consumedOperands = 2;9825break;9826case glslang::EOpBitfieldExtract:9827if (isUnsigned)9828opCode = spv::Op::OpBitFieldUExtract;9829else9830opCode = spv::Op::OpBitFieldSExtract;9831break;9832case glslang::EOpBitfieldInsert:9833opCode = spv::Op::OpBitFieldInsert;9834break;98359836case glslang::EOpFma:9837libCall = spv::GLSLstd450Fma;9838break;9839case glslang::EOpFrexp:9840{9841libCall = spv::GLSLstd450FrexpStruct;9842assert(builder.isPointerType(typeId1));9843typeId1 = builder.getContainedTypeId(typeId1);9844int width = builder.getScalarTypeWidth(typeId1);9845if (width == 16)9846// Using 16-bit exp operand, enable extension SPV_AMD_gpu_shader_int169847builder.addExtension(spv::E_SPV_AMD_gpu_shader_int16);9848if (builder.getNumComponents(operands[0]) == 1)9849frexpIntType = builder.makeIntegerType(width, true);9850else9851frexpIntType = builder.makeVectorType(builder.makeIntegerType(width, true),9852builder.getNumComponents(operands[0]));9853typeId = builder.makeStructResultType(typeId0, frexpIntType);9854consumedOperands = 1;9855}9856break;9857case glslang::EOpLdexp:9858libCall = spv::GLSLstd450Ldexp;9859break;98609861case glslang::EOpReadInvocation:9862return createInvocationsOperation(op, typeId, operands, typeProxy);98639864case glslang::EOpSubgroupBroadcast:9865case glslang::EOpSubgroupBallotBitExtract:9866case glslang::EOpSubgroupShuffle:9867case glslang::EOpSubgroupShuffleXor:9868case glslang::EOpSubgroupShuffleUp:9869case glslang::EOpSubgroupShuffleDown:9870case glslang::EOpSubgroupRotate:9871case glslang::EOpSubgroupClusteredRotate:9872case glslang::EOpSubgroupClusteredAdd:9873case glslang::EOpSubgroupClusteredMul:9874case glslang::EOpSubgroupClusteredMin:9875case glslang::EOpSubgroupClusteredMax:9876case glslang::EOpSubgroupClusteredAnd:9877case 
glslang::EOpSubgroupClusteredOr:9878case glslang::EOpSubgroupClusteredXor:9879case glslang::EOpSubgroupQuadBroadcast:9880case glslang::EOpSubgroupPartitionedAdd:9881case glslang::EOpSubgroupPartitionedMul:9882case glslang::EOpSubgroupPartitionedMin:9883case glslang::EOpSubgroupPartitionedMax:9884case glslang::EOpSubgroupPartitionedAnd:9885case glslang::EOpSubgroupPartitionedOr:9886case glslang::EOpSubgroupPartitionedXor:9887case glslang::EOpSubgroupPartitionedInclusiveAdd:9888case glslang::EOpSubgroupPartitionedInclusiveMul:9889case glslang::EOpSubgroupPartitionedInclusiveMin:9890case glslang::EOpSubgroupPartitionedInclusiveMax:9891case glslang::EOpSubgroupPartitionedInclusiveAnd:9892case glslang::EOpSubgroupPartitionedInclusiveOr:9893case glslang::EOpSubgroupPartitionedInclusiveXor:9894case glslang::EOpSubgroupPartitionedExclusiveAdd:9895case glslang::EOpSubgroupPartitionedExclusiveMul:9896case glslang::EOpSubgroupPartitionedExclusiveMin:9897case glslang::EOpSubgroupPartitionedExclusiveMax:9898case glslang::EOpSubgroupPartitionedExclusiveAnd:9899case glslang::EOpSubgroupPartitionedExclusiveOr:9900case glslang::EOpSubgroupPartitionedExclusiveXor:9901return createSubgroupOperation(op, typeId, operands, typeProxy);99029903case glslang::EOpSwizzleInvocations:9904extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_ballot);9905libCall = spv::SwizzleInvocationsAMD;9906break;9907case glslang::EOpSwizzleInvocationsMasked:9908extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_ballot);9909libCall = spv::SwizzleInvocationsMaskedAMD;9910break;9911case glslang::EOpWriteInvocation:9912extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_ballot);9913libCall = spv::WriteInvocationAMD;9914break;99159916case glslang::EOpMin3:9917extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_trinary_minmax);9918if (isFloat)9919libCall = spv::FMin3AMD;9920else {9921if (isUnsigned)9922libCall = spv::UMin3AMD;9923else9924libCall = spv::SMin3AMD;9925}9926break;9927case glslang::EOpMax3:9928extBuiltins 
= getExtBuiltins(spv::E_SPV_AMD_shader_trinary_minmax);9929if (isFloat)9930libCall = spv::FMax3AMD;9931else {9932if (isUnsigned)9933libCall = spv::UMax3AMD;9934else9935libCall = spv::SMax3AMD;9936}9937break;9938case glslang::EOpMid3:9939extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_trinary_minmax);9940if (isFloat)9941libCall = spv::FMid3AMD;9942else {9943if (isUnsigned)9944libCall = spv::UMid3AMD;9945else9946libCall = spv::SMid3AMD;9947}9948break;99499950case glslang::EOpInterpolateAtVertex:9951if (typeProxy == glslang::EbtFloat16)9952builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float);9953extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_explicit_vertex_parameter);9954libCall = spv::InterpolateAtVertexAMD;9955break;99569957case glslang::EOpReportIntersection:9958typeId = builder.makeBoolType();9959opCode = spv::Op::OpReportIntersectionKHR;9960break;9961case glslang::EOpTraceNV:9962builder.createNoResultOp(spv::Op::OpTraceNV, operands);9963return 0;9964case glslang::EOpTraceRayMotionNV:9965builder.addExtension(spv::E_SPV_NV_ray_tracing_motion_blur);9966builder.addCapability(spv::Capability::RayTracingMotionBlurNV);9967builder.createNoResultOp(spv::Op::OpTraceRayMotionNV, operands);9968return 0;9969case glslang::EOpTraceKHR:9970builder.createNoResultOp(spv::Op::OpTraceRayKHR, operands);9971return 0;9972case glslang::EOpExecuteCallableNV:9973builder.createNoResultOp(spv::Op::OpExecuteCallableNV, operands);9974return 0;9975case glslang::EOpExecuteCallableKHR:9976builder.createNoResultOp(spv::Op::OpExecuteCallableKHR, operands);9977return 0;99789979case glslang::EOpRayQueryInitialize:9980builder.createNoResultOp(spv::Op::OpRayQueryInitializeKHR, operands);9981return 0;9982case glslang::EOpRayQueryTerminate:9983builder.createNoResultOp(spv::Op::OpRayQueryTerminateKHR, operands);9984return 0;9985case glslang::EOpRayQueryGenerateIntersection:9986builder.createNoResultOp(spv::Op::OpRayQueryGenerateIntersectionKHR, operands);9987return 0;9988case 
glslang::EOpRayQueryConfirmIntersection:9989builder.createNoResultOp(spv::Op::OpRayQueryConfirmIntersectionKHR, operands);9990return 0;9991case glslang::EOpRayQueryProceed:9992typeId = builder.makeBoolType();9993opCode = spv::Op::OpRayQueryProceedKHR;9994break;9995case glslang::EOpRayQueryGetIntersectionType:9996typeId = builder.makeUintType(32);9997opCode = spv::Op::OpRayQueryGetIntersectionTypeKHR;9998break;9999case glslang::EOpRayQueryGetRayTMin:10000typeId = builder.makeFloatType(32);10001opCode = spv::Op::OpRayQueryGetRayTMinKHR;10002break;10003case glslang::EOpRayQueryGetRayFlags:10004typeId = builder.makeIntType(32);10005opCode = spv::Op::OpRayQueryGetRayFlagsKHR;10006break;10007case glslang::EOpRayQueryGetIntersectionT:10008typeId = builder.makeFloatType(32);10009opCode = spv::Op::OpRayQueryGetIntersectionTKHR;10010break;10011case glslang::EOpRayQueryGetIntersectionInstanceCustomIndex:10012typeId = builder.makeIntType(32);10013opCode = spv::Op::OpRayQueryGetIntersectionInstanceCustomIndexKHR;10014break;10015case glslang::EOpRayQueryGetIntersectionInstanceId:10016typeId = builder.makeIntType(32);10017opCode = spv::Op::OpRayQueryGetIntersectionInstanceIdKHR;10018break;10019case glslang::EOpRayQueryGetIntersectionInstanceShaderBindingTableRecordOffset:10020typeId = builder.makeUintType(32);10021opCode = spv::Op::OpRayQueryGetIntersectionInstanceShaderBindingTableRecordOffsetKHR;10022break;10023case glslang::EOpRayQueryGetIntersectionGeometryIndex:10024typeId = builder.makeIntType(32);10025opCode = spv::Op::OpRayQueryGetIntersectionGeometryIndexKHR;10026break;10027case glslang::EOpRayQueryGetIntersectionPrimitiveIndex:10028typeId = builder.makeIntType(32);10029opCode = spv::Op::OpRayQueryGetIntersectionPrimitiveIndexKHR;10030break;10031case glslang::EOpRayQueryGetIntersectionBarycentrics:10032typeId = builder.makeVectorType(builder.makeFloatType(32), 2);10033opCode = spv::Op::OpRayQueryGetIntersectionBarycentricsKHR;10034break;10035case 
glslang::EOpRayQueryGetIntersectionFrontFace:10036typeId = builder.makeBoolType();10037opCode = spv::Op::OpRayQueryGetIntersectionFrontFaceKHR;10038break;10039case glslang::EOpRayQueryGetIntersectionCandidateAABBOpaque:10040typeId = builder.makeBoolType();10041opCode = spv::Op::OpRayQueryGetIntersectionCandidateAABBOpaqueKHR;10042break;10043case glslang::EOpRayQueryGetIntersectionObjectRayDirection:10044typeId = builder.makeVectorType(builder.makeFloatType(32), 3);10045opCode = spv::Op::OpRayQueryGetIntersectionObjectRayDirectionKHR;10046break;10047case glslang::EOpRayQueryGetIntersectionObjectRayOrigin:10048typeId = builder.makeVectorType(builder.makeFloatType(32), 3);10049opCode = spv::Op::OpRayQueryGetIntersectionObjectRayOriginKHR;10050break;10051case glslang::EOpRayQueryGetWorldRayDirection:10052typeId = builder.makeVectorType(builder.makeFloatType(32), 3);10053opCode = spv::Op::OpRayQueryGetWorldRayDirectionKHR;10054break;10055case glslang::EOpRayQueryGetWorldRayOrigin:10056typeId = builder.makeVectorType(builder.makeFloatType(32), 3);10057opCode = spv::Op::OpRayQueryGetWorldRayOriginKHR;10058break;10059case glslang::EOpRayQueryGetIntersectionObjectToWorld:10060typeId = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);10061opCode = spv::Op::OpRayQueryGetIntersectionObjectToWorldKHR;10062break;10063case glslang::EOpRayQueryGetIntersectionClusterIdNV:10064typeId = builder.makeIntegerType(32, 1);10065opCode = spv::Op::OpRayQueryGetClusterIdNV;10066break;10067case glslang::EOpRayQueryGetIntersectionWorldToObject:10068typeId = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);10069opCode = spv::Op::OpRayQueryGetIntersectionWorldToObjectKHR;10070break;10071case glslang::EOpRayQueryGetIntersectionSpherePositionNV:10072typeId = builder.makeVectorType(builder.makeFloatType(32), 3);10073opCode = spv::Op::OpRayQueryGetIntersectionSpherePositionNV;10074break;10075case glslang::EOpRayQueryGetIntersectionSphereRadiusNV:10076typeId = 
builder.makeFloatType(32);10077opCode = spv::Op::OpRayQueryGetIntersectionSphereRadiusNV;10078break;10079case glslang::EOpRayQueryGetIntersectionLSSHitValueNV:10080typeId = builder.makeFloatType(32);10081opCode = spv::Op::OpRayQueryGetIntersectionLSSHitValueNV;10082break;10083case glslang::EOpRayQueryIsSphereHitNV:10084typeId = builder.makeBoolType();10085opCode = spv::Op::OpRayQueryIsSphereHitNV;10086break;10087case glslang::EOpRayQueryIsLSSHitNV:10088typeId = builder.makeBoolType();10089opCode = spv::Op::OpRayQueryIsLSSHitNV;10090break;10091case glslang::EOpWritePackedPrimitiveIndices4x8NV:10092builder.createNoResultOp(spv::Op::OpWritePackedPrimitiveIndices4x8NV, operands);10093return 0;10094case glslang::EOpEmitMeshTasksEXT:10095if (taskPayloadID)10096operands.push_back(taskPayloadID);10097// As per SPV_EXT_mesh_shader make it a terminating instruction in the current block10098builder.makeStatementTerminator(spv::Op::OpEmitMeshTasksEXT, operands, "post-OpEmitMeshTasksEXT");10099return 0;10100case glslang::EOpSetMeshOutputsEXT:10101builder.createNoResultOp(spv::Op::OpSetMeshOutputsEXT, operands);10102return 0;10103case glslang::EOpCooperativeMatrixMulAddNV:10104opCode = spv::Op::OpCooperativeMatrixMulAddNV;10105break;10106case glslang::EOpHitObjectTraceRayNV:10107builder.createNoResultOp(spv::Op::OpHitObjectTraceRayNV, operands);10108return 0;10109case glslang::EOpHitObjectTraceRayEXT:10110builder.createNoResultOp(spv::Op::OpHitObjectTraceRayEXT, operands);10111return 0;10112case glslang::EOpHitObjectTraceRayMotionNV:10113builder.createNoResultOp(spv::Op::OpHitObjectTraceRayMotionNV, operands);10114return 0;10115case glslang::EOpHitObjectTraceRayMotionEXT:10116builder.createNoResultOp(spv::Op::OpHitObjectTraceRayMotionEXT, operands);10117return 0;10118case glslang::EOpHitObjectRecordHitNV:10119builder.createNoResultOp(spv::Op::OpHitObjectRecordHitNV, operands);10120return 0;10121case 
glslang::EOpHitObjectRecordHitMotionNV:10122builder.createNoResultOp(spv::Op::OpHitObjectRecordHitMotionNV, operands);10123return 0;10124case glslang::EOpHitObjectRecordHitWithIndexNV:10125builder.createNoResultOp(spv::Op::OpHitObjectRecordHitWithIndexNV, operands);10126return 0;10127case glslang::EOpHitObjectRecordHitWithIndexMotionNV:10128builder.createNoResultOp(spv::Op::OpHitObjectRecordHitWithIndexMotionNV, operands);10129return 0;10130case glslang::EOpHitObjectRecordMissNV:10131builder.createNoResultOp(spv::Op::OpHitObjectRecordMissNV, operands);10132return 0;10133case glslang::EOpHitObjectRecordMissEXT:10134builder.createNoResultOp(spv::Op::OpHitObjectRecordMissEXT, operands);10135return 0;10136case glslang::EOpHitObjectRecordMissMotionNV:10137builder.createNoResultOp(spv::Op::OpHitObjectRecordMissMotionNV, operands);10138return 0;10139case glslang::EOpHitObjectRecordMissMotionEXT:10140builder.createNoResultOp(spv::Op::OpHitObjectRecordMissMotionEXT, operands);10141return 0;10142case glslang::EOpHitObjectExecuteShaderNV:10143builder.createNoResultOp(spv::Op::OpHitObjectExecuteShaderNV, operands);10144return 0;10145case glslang::EOpHitObjectExecuteShaderEXT:10146builder.createNoResultOp(spv::Op::OpHitObjectExecuteShaderEXT, operands);10147return 0;10148case glslang::EOpHitObjectIsEmptyNV:10149typeId = builder.makeBoolType();10150opCode = spv::Op::OpHitObjectIsEmptyNV;10151break;10152case glslang::EOpHitObjectIsEmptyEXT:10153typeId = builder.makeBoolType();10154opCode = spv::Op::OpHitObjectIsEmptyEXT;10155break;10156case glslang::EOpHitObjectIsMissNV:10157typeId = builder.makeBoolType();10158opCode = spv::Op::OpHitObjectIsMissNV;10159break;10160case glslang::EOpHitObjectIsMissEXT:10161typeId = builder.makeBoolType();10162opCode = spv::Op::OpHitObjectIsMissEXT;10163break;10164case glslang::EOpHitObjectIsHitNV:10165typeId = builder.makeBoolType();10166opCode = spv::Op::OpHitObjectIsHitNV;10167break;10168case glslang::EOpHitObjectIsSphereHitNV:10169typeId = 
builder.makeBoolType();10170opCode = spv::Op::OpHitObjectIsSphereHitNV;10171break;10172case glslang::EOpHitObjectIsLSSHitNV:10173typeId = builder.makeBoolType();10174opCode = spv::Op::OpHitObjectIsLSSHitNV;10175break;10176case glslang::EOpHitObjectIsHitEXT:10177typeId = builder.makeBoolType();10178opCode = spv::Op::OpHitObjectIsHitEXT;10179break;10180case glslang::EOpHitObjectGetRayTMinNV:10181typeId = builder.makeFloatType(32);10182opCode = spv::Op::OpHitObjectGetRayTMinNV;10183break;10184case glslang::EOpHitObjectGetRayTMinEXT:10185typeId = builder.makeFloatType(32);10186opCode = spv::Op::OpHitObjectGetRayTMinEXT;10187break;10188case glslang::EOpHitObjectGetRayTMaxNV:10189typeId = builder.makeFloatType(32);10190opCode = spv::Op::OpHitObjectGetRayTMaxNV;10191break;10192case glslang::EOpHitObjectGetRayTMaxEXT:10193typeId = builder.makeFloatType(32);10194opCode = spv::Op::OpHitObjectGetRayTMaxEXT;10195break;10196case glslang::EOpHitObjectGetRayFlagsEXT:10197typeId = builder.makeIntegerType(32, 0);10198opCode = spv::Op::OpHitObjectGetRayFlagsEXT;10199break;10200case glslang::EOpHitObjectGetObjectRayOriginNV:10201typeId = builder.makeVectorType(builder.makeFloatType(32), 3);10202opCode = spv::Op::OpHitObjectGetObjectRayOriginNV;10203break;10204case glslang::EOpHitObjectGetObjectRayOriginEXT:10205typeId = builder.makeVectorType(builder.makeFloatType(32), 3);10206opCode = spv::Op::OpHitObjectGetObjectRayOriginEXT;10207break;10208case glslang::EOpHitObjectGetObjectRayDirectionNV:10209typeId = builder.makeVectorType(builder.makeFloatType(32), 3);10210opCode = spv::Op::OpHitObjectGetObjectRayDirectionNV;10211break;10212case glslang::EOpHitObjectGetObjectRayDirectionEXT:10213typeId = builder.makeVectorType(builder.makeFloatType(32), 3);10214opCode = spv::Op::OpHitObjectGetObjectRayDirectionEXT;10215break;10216case glslang::EOpHitObjectGetWorldRayOriginNV:10217typeId = builder.makeVectorType(builder.makeFloatType(32), 3);10218opCode = 
spv::Op::OpHitObjectGetWorldRayOriginNV;10219break;10220case glslang::EOpHitObjectGetWorldRayOriginEXT:10221typeId = builder.makeVectorType(builder.makeFloatType(32), 3);10222opCode = spv::Op::OpHitObjectGetWorldRayOriginEXT;10223break;10224case glslang::EOpHitObjectGetWorldRayDirectionNV:10225typeId = builder.makeVectorType(builder.makeFloatType(32), 3);10226opCode = spv::Op::OpHitObjectGetWorldRayDirectionNV;10227break;10228case glslang::EOpHitObjectGetWorldRayDirectionEXT:10229typeId = builder.makeVectorType(builder.makeFloatType(32), 3);10230opCode = spv::Op::OpHitObjectGetWorldRayDirectionEXT;10231break;10232case glslang::EOpHitObjectGetWorldToObjectNV:10233typeId = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);10234opCode = spv::Op::OpHitObjectGetWorldToObjectNV;10235break;10236case glslang::EOpHitObjectGetWorldToObjectEXT:10237typeId = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);10238opCode = spv::Op::OpHitObjectGetWorldToObjectEXT;10239break;10240case glslang::EOpHitObjectGetObjectToWorldNV:10241typeId = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);10242opCode = spv::Op::OpHitObjectGetObjectToWorldNV;10243break;10244case glslang::EOpHitObjectGetObjectToWorldEXT:10245typeId = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);10246opCode = spv::Op::OpHitObjectGetObjectToWorldEXT;10247break;10248case glslang::EOpHitObjectGetInstanceCustomIndexNV:10249typeId = builder.makeIntegerType(32, 1);10250opCode = spv::Op::OpHitObjectGetInstanceCustomIndexNV;10251break;10252case glslang::EOpHitObjectGetInstanceCustomIndexEXT:10253typeId = builder.makeIntegerType(32, 1);10254opCode = spv::Op::OpHitObjectGetInstanceCustomIndexEXT;10255break;10256case glslang::EOpHitObjectGetInstanceIdNV:10257typeId = builder.makeIntegerType(32, 1);10258opCode = spv::Op::OpHitObjectGetInstanceIdNV;10259break;10260case glslang::EOpHitObjectGetInstanceIdEXT:10261typeId = builder.makeIntegerType(32, 1);10262opCode = 
spv::Op::OpHitObjectGetInstanceIdEXT;10263break;10264case glslang::EOpHitObjectGetGeometryIndexNV:10265typeId = builder.makeIntegerType(32, 1);10266opCode = spv::Op::OpHitObjectGetGeometryIndexNV;10267break;10268case glslang::EOpHitObjectGetGeometryIndexEXT:10269typeId = builder.makeIntegerType(32, 1);10270opCode = spv::Op::OpHitObjectGetGeometryIndexEXT;10271break;10272case glslang::EOpHitObjectGetPrimitiveIndexNV:10273typeId = builder.makeIntegerType(32, 1);10274opCode = spv::Op::OpHitObjectGetPrimitiveIndexNV;10275break;10276case glslang::EOpHitObjectGetPrimitiveIndexEXT:10277typeId = builder.makeIntegerType(32, 1);10278opCode = spv::Op::OpHitObjectGetPrimitiveIndexEXT;10279break;10280case glslang::EOpHitObjectGetHitKindNV:10281typeId = builder.makeIntegerType(32, 0);10282opCode = spv::Op::OpHitObjectGetHitKindNV;10283break;10284case glslang::EOpHitObjectGetHitKindEXT:10285typeId = builder.makeIntegerType(32, 0);10286opCode = spv::Op::OpHitObjectGetHitKindEXT;10287break;10288case glslang::EOpHitObjectGetCurrentTimeNV:10289typeId = builder.makeFloatType(32);10290opCode = spv::Op::OpHitObjectGetCurrentTimeNV;10291break;10292case glslang::EOpHitObjectGetCurrentTimeEXT:10293typeId = builder.makeFloatType(32);10294opCode = spv::Op::OpHitObjectGetCurrentTimeEXT;10295break;10296case glslang::EOpHitObjectGetShaderBindingTableRecordIndexNV:10297typeId = builder.makeIntegerType(32, 0);10298opCode = spv::Op::OpHitObjectGetShaderBindingTableRecordIndexNV;10299return 0;10300case glslang::EOpHitObjectGetShaderBindingTableRecordIndexEXT:10301typeId = builder.makeIntegerType(32, 0);10302opCode = spv::Op::OpHitObjectGetShaderBindingTableRecordIndexEXT;10303return 0;10304case glslang::EOpHitObjectGetAttributesNV:10305builder.createNoResultOp(spv::Op::OpHitObjectGetAttributesNV, operands);10306return 0;10307case glslang::EOpHitObjectGetAttributesEXT:10308builder.createNoResultOp(spv::Op::OpHitObjectGetAttributesEXT, operands);10309return 0;10310case 
glslang::EOpHitObjectRecordFromQueryEXT:10311builder.createNoResultOp(spv::Op::OpHitObjectRecordFromQueryEXT, operands);10312return 0;10313case glslang::EOpHitObjectGetShaderRecordBufferHandleNV:10314typeId = builder.makeVectorType(builder.makeUintType(32), 2);10315opCode = spv::Op::OpHitObjectGetShaderRecordBufferHandleNV;10316break;10317case glslang::EOpHitObjectGetClusterIdNV:10318typeId = builder.makeIntegerType(32, 1);10319opCode = spv::Op::OpHitObjectGetClusterIdNV;10320break;10321case glslang::EOpHitObjectGetShaderRecordBufferHandleEXT:10322typeId = builder.makeVectorType(builder.makeUintType(32), 2);10323opCode = spv::Op::OpHitObjectGetShaderRecordBufferHandleEXT;10324break;10325case glslang::EOpHitObjectSetShaderBindingTableRecordIndexEXT:10326builder.createNoResultOp(spv::Op::OpHitObjectSetShaderBindingTableRecordIndexEXT, operands);10327return 0;10328case glslang::EOpReorderThreadNV: {10329if (operands.size() == 2) {10330builder.createNoResultOp(spv::Op::OpReorderThreadWithHintNV, operands);10331} else {10332builder.createNoResultOp(spv::Op::OpReorderThreadWithHitObjectNV, operands);10333}10334return 0;10335}10336case glslang::EOpReorderThreadEXT: {10337if (operands.size() == 2) {10338builder.createNoResultOp(spv::Op::OpReorderThreadWithHintEXT, operands);10339} else {10340builder.createNoResultOp(spv::Op::OpReorderThreadWithHitObjectEXT, operands);10341}10342return 0;10343}1034410345case glslang::EOpHitObjectReorderExecuteEXT: {10346if (operands.size() == 2) {10347builder.createNoResultOp(spv::Op::OpHitObjectReorderExecuteShaderEXT, operands);10348} else {10349// GLSL intrinsic is10350// hitObjectReorderExecuteEXT(hitObjectEXT hitObject, uint hint, uint bits,int payload) while10351// SPIRV is hitObject id , payload id, optional hint id, optional bits id hence reorder operands10352builder.createNoResultOp(spv::Op::OpHitObjectReorderExecuteShaderEXT, {operands[0], operands[3], operands[1], operands[2]});10353}10354return 0;10355}1035610357case 
glslang::EOpHitObjectTraceReorderExecuteEXT: {10358if (operands.size() == 12) {10359builder.createNoResultOp(spv::Op::OpHitObjectTraceReorderExecuteEXT, operands);10360} else {10361std::vector<spv::Id> argOperands;10362std::copy(operands.begin(), operands.begin() + 11, std::back_inserter(argOperands));10363argOperands.push_back(operands[13]);10364argOperands.push_back(operands[11]);10365argOperands.push_back(operands[12]);10366builder.createNoResultOp(spv::Op::OpHitObjectTraceReorderExecuteEXT, argOperands);10367}10368return 0;10369}10370case glslang::EOpHitObjectTraceMotionReorderExecuteEXT: {10371if (operands.size() == 13) {10372builder.createNoResultOp(spv::Op::OpHitObjectTraceMotionReorderExecuteEXT, operands);10373} else {10374std::vector<spv::Id> argOperands;10375std::copy(operands.begin(), operands.begin() + 12, std::back_inserter(argOperands));10376argOperands.push_back(operands[14]);10377argOperands.push_back(operands[12]);10378argOperands.push_back(operands[13]);10379builder.createNoResultOp(spv::Op::OpHitObjectTraceMotionReorderExecuteEXT, argOperands);10380}10381return 0;10382}10383case glslang::EOpImageSampleWeightedQCOM:10384typeId = builder.makeVectorType(builder.makeFloatType(32), 4);10385opCode = spv::Op::OpImageSampleWeightedQCOM;10386addImageProcessingQCOMDecoration(operands[2], spv::Decoration::WeightTextureQCOM);10387break;10388case glslang::EOpImageBoxFilterQCOM:10389typeId = builder.makeVectorType(builder.makeFloatType(32), 4);10390opCode = spv::Op::OpImageBoxFilterQCOM;10391break;10392case glslang::EOpImageBlockMatchSADQCOM:10393typeId = builder.makeVectorType(builder.makeFloatType(32), 4);10394opCode = spv::Op::OpImageBlockMatchSADQCOM;10395addImageProcessingQCOMDecoration(operands[0], spv::Decoration::BlockMatchTextureQCOM);10396addImageProcessingQCOMDecoration(operands[2], spv::Decoration::BlockMatchTextureQCOM);10397break;10398case glslang::EOpImageBlockMatchSSDQCOM:10399typeId = builder.makeVectorType(builder.makeFloatType(32), 
4);10400opCode = spv::Op::OpImageBlockMatchSSDQCOM;10401addImageProcessingQCOMDecoration(operands[0], spv::Decoration::BlockMatchTextureQCOM);10402addImageProcessingQCOMDecoration(operands[2], spv::Decoration::BlockMatchTextureQCOM);10403break;1040410405case glslang::EOpFetchMicroTriangleVertexBarycentricNV:10406typeId = builder.makeVectorType(builder.makeFloatType(32), 2);10407opCode = spv::Op::OpFetchMicroTriangleVertexBarycentricNV;10408break;1040910410case glslang::EOpFetchMicroTriangleVertexPositionNV:10411typeId = builder.makeVectorType(builder.makeFloatType(32), 3);10412opCode = spv::Op::OpFetchMicroTriangleVertexPositionNV;10413break;1041410415case glslang::EOpImageBlockMatchWindowSSDQCOM:10416typeId = builder.makeVectorType(builder.makeFloatType(32), 4);10417opCode = spv::Op::OpImageBlockMatchWindowSSDQCOM;10418addImageProcessing2QCOMDecoration(operands[0], false);10419addImageProcessing2QCOMDecoration(operands[2], false);10420break;10421case glslang::EOpImageBlockMatchWindowSADQCOM:10422typeId = builder.makeVectorType(builder.makeFloatType(32), 4);10423opCode = spv::Op::OpImageBlockMatchWindowSADQCOM;10424addImageProcessing2QCOMDecoration(operands[0], false);10425addImageProcessing2QCOMDecoration(operands[2], false);10426break;10427case glslang::EOpImageBlockMatchGatherSSDQCOM:10428typeId = builder.makeVectorType(builder.makeFloatType(32), 4);10429opCode = spv::Op::OpImageBlockMatchGatherSSDQCOM;10430addImageProcessing2QCOMDecoration(operands[0], true);10431addImageProcessing2QCOMDecoration(operands[2], true);10432break;10433case glslang::EOpImageBlockMatchGatherSADQCOM:10434typeId = builder.makeVectorType(builder.makeFloatType(32), 4);10435opCode = spv::Op::OpImageBlockMatchGatherSADQCOM;10436addImageProcessing2QCOMDecoration(operands[0], true);10437addImageProcessing2QCOMDecoration(operands[2], true);10438break;10439case glslang::EOpCreateTensorLayoutNV:10440return builder.createOp(spv::Op::OpCreateTensorLayoutNV, typeId, 
std::vector<spv::Id>{});10441case glslang::EOpCreateTensorViewNV:10442return builder.createOp(spv::Op::OpCreateTensorViewNV, typeId, std::vector<spv::Id>{});10443case glslang::EOpTensorLayoutSetBlockSizeNV:10444opCode = spv::Op::OpTensorLayoutSetBlockSizeNV;10445break;10446case glslang::EOpTensorLayoutSetDimensionNV:10447opCode = spv::Op::OpTensorLayoutSetDimensionNV;10448break;10449case glslang::EOpTensorLayoutSetStrideNV:10450opCode = spv::Op::OpTensorLayoutSetStrideNV;10451break;10452case glslang::EOpTensorLayoutSliceNV:10453opCode = spv::Op::OpTensorLayoutSliceNV;10454break;10455case glslang::EOpTensorLayoutSetClampValueNV:10456opCode = spv::Op::OpTensorLayoutSetClampValueNV;10457break;10458case glslang::EOpTensorViewSetDimensionNV:10459opCode = spv::Op::OpTensorViewSetDimensionNV;10460break;10461case glslang::EOpTensorViewSetStrideNV:10462opCode = spv::Op::OpTensorViewSetStrideNV;10463break;10464case glslang::EOpTensorViewSetClipNV:10465opCode = spv::Op::OpTensorViewSetClipNV;10466break;10467default:10468return 0;10469}1047010471spv::Id id = 0;10472if (libCall >= 0) {10473// Use an extended instruction from the standard library.10474// Construct the call arguments, without modifying the original operands vector.10475// We might need the remaining arguments, e.g. in the EOpFrexp case.10476std::vector<spv::Id> callArguments(operands.begin(), operands.begin() + consumedOperands);10477id = builder.createBuiltinCall(typeId, extBuiltins >= 0 ? 
extBuiltins : stdBuiltins, libCall, callArguments);10478} else if (opCode == spv::Op::OpDot && !isFloat) {10479// int dot(int, int)10480// NOTE: never called for scalar/vector1, this is turned into simple mul before this can be reached10481const int componentCount = builder.getNumComponents(operands[0]);10482spv::Id mulOp = builder.createBinOp(spv::Op::OpIMul, builder.getTypeId(operands[0]), operands[0], operands[1]);10483builder.setPrecision(mulOp, precision);10484id = builder.createCompositeExtract(mulOp, typeId, 0);10485for (int i = 1; i < componentCount; ++i) {10486builder.setPrecision(id, precision);10487id = builder.createBinOp(spv::Op::OpIAdd, typeId, id, builder.createCompositeExtract(mulOp, typeId, i));10488}10489} else {10490switch (consumedOperands) {10491case 0:10492// should all be handled by visitAggregate and createNoArgOperation10493assert(0);10494return 0;10495case 1:10496// should all be handled by createUnaryOperation10497assert(0);10498return 0;10499case 2:10500id = builder.createBinOp(opCode, typeId, operands[0], operands[1]);10501break;10502default:10503// anything 3 or over doesn't have l-value operands, so all should be consumed10504assert(consumedOperands == operands.size());10505id = builder.createOp(opCode, typeId, operands);10506break;10507}10508}1050910510// Decode the return types that were structures10511switch (op) {10512case glslang::EOpAddCarry:10513case glslang::EOpSubBorrow:10514builder.createStore(builder.createCompositeExtract(id, typeId0, 1), operands[2]);10515id = builder.createCompositeExtract(id, typeId0, 0);10516break;10517case glslang::EOpUMulExtended:10518case glslang::EOpIMulExtended:10519builder.createStore(builder.createCompositeExtract(id, typeId0, 0), operands[3]);10520builder.createStore(builder.createCompositeExtract(id, typeId0, 1), operands[2]);10521break;10522case glslang::EOpModf:10523{10524assert(operands.size() == 2);10525builder.createStore(builder.createCompositeExtract(id, typeId0, 1), 
operands[1]);10526id = builder.createCompositeExtract(id, typeId0, 0);10527}10528break;10529case glslang::EOpFrexp:10530{10531assert(operands.size() == 2);10532if (builder.isFloatType(builder.getScalarTypeId(typeId1))) {10533// "exp" is floating-point type (from HLSL intrinsic)10534spv::Id member1 = builder.createCompositeExtract(id, frexpIntType, 1);10535member1 = builder.createUnaryOp(spv::Op::OpConvertSToF, typeId1, member1);10536builder.createStore(member1, operands[1]);10537} else10538// "exp" is integer type (from GLSL built-in function)10539builder.createStore(builder.createCompositeExtract(id, frexpIntType, 1), operands[1]);10540id = builder.createCompositeExtract(id, typeId0, 0);10541}10542break;10543default:10544break;10545}1054610547return builder.setPrecision(id, precision);10548}1054910550// Intrinsics with no arguments (or no return value, and no precision).10551spv::Id TGlslangToSpvTraverser::createNoArgOperation(glslang::TOperator op, spv::Decoration precision, spv::Id typeId)10552{10553// GLSL memory barriers use queuefamily scope in new model, device scope in old model10554spv::Scope memoryBarrierScope = glslangIntermediate->usingVulkanMemoryModel() ?10555spv::Scope::QueueFamilyKHR : spv::Scope::Device;1055610557switch (op) {10558case glslang::EOpBarrier:10559if (glslangIntermediate->getStage() == EShLangTessControl) {10560if (glslangIntermediate->usingVulkanMemoryModel()) {10561builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Workgroup,10562spv::MemorySemanticsMask::OutputMemoryKHR |10563spv::MemorySemanticsMask::AcquireRelease);10564builder.addCapability(spv::Capability::VulkanMemoryModelKHR);10565} else {10566builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Invocation, spv::MemorySemanticsMask::MaskNone);10567}10568} else {10569builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Workgroup,10570spv::MemorySemanticsMask::WorkgroupMemory |10571spv::MemorySemanticsMask::AcquireRelease);10572}10573return 
0;10574case glslang::EOpMemoryBarrier:10575builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsAllMemory |10576spv::MemorySemanticsMask::AcquireRelease);10577return 0;10578case glslang::EOpMemoryBarrierBuffer:10579builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsMask::UniformMemory |10580spv::MemorySemanticsMask::AcquireRelease);10581return 0;10582case glslang::EOpMemoryBarrierShared:10583builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsMask::WorkgroupMemory |10584spv::MemorySemanticsMask::AcquireRelease);10585return 0;10586case glslang::EOpGroupMemoryBarrier:10587builder.createMemoryBarrier(spv::Scope::Workgroup, spv::MemorySemanticsAllMemory |10588spv::MemorySemanticsMask::AcquireRelease);10589return 0;10590case glslang::EOpMemoryBarrierAtomicCounter:10591builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsMask::AtomicCounterMemory |10592spv::MemorySemanticsMask::AcquireRelease);10593return 0;10594case glslang::EOpMemoryBarrierImage:10595builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsMask::ImageMemory |10596spv::MemorySemanticsMask::AcquireRelease);10597return 0;10598case glslang::EOpAllMemoryBarrierWithGroupSync:10599builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Device,10600spv::MemorySemanticsAllMemory |10601spv::MemorySemanticsMask::AcquireRelease);10602return 0;10603case glslang::EOpDeviceMemoryBarrier:10604builder.createMemoryBarrier(spv::Scope::Device, spv::MemorySemanticsMask::UniformMemory |10605spv::MemorySemanticsMask::ImageMemory |10606spv::MemorySemanticsMask::AcquireRelease);10607return 0;10608case glslang::EOpDeviceMemoryBarrierWithGroupSync:10609builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Device, spv::MemorySemanticsMask::UniformMemory |10610spv::MemorySemanticsMask::ImageMemory |10611spv::MemorySemanticsMask::AcquireRelease);10612return 0;10613case 
glslang::EOpWorkgroupMemoryBarrier:10614builder.createMemoryBarrier(spv::Scope::Workgroup, spv::MemorySemanticsMask::WorkgroupMemory |10615spv::MemorySemanticsMask::AcquireRelease);10616return 0;10617case glslang::EOpWorkgroupMemoryBarrierWithGroupSync:10618builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Workgroup,10619spv::MemorySemanticsMask::WorkgroupMemory |10620spv::MemorySemanticsMask::AcquireRelease);10621return 0;10622case glslang::EOpSubgroupBarrier:10623builder.createControlBarrier(spv::Scope::Subgroup, spv::Scope::Subgroup, spv::MemorySemanticsAllMemory |10624spv::MemorySemanticsMask::AcquireRelease);10625return spv::NoResult;10626case glslang::EOpSubgroupMemoryBarrier:10627builder.createMemoryBarrier(spv::Scope::Subgroup, spv::MemorySemanticsAllMemory |10628spv::MemorySemanticsMask::AcquireRelease);10629return spv::NoResult;10630case glslang::EOpSubgroupMemoryBarrierBuffer:10631builder.createMemoryBarrier(spv::Scope::Subgroup, spv::MemorySemanticsMask::UniformMemory |10632spv::MemorySemanticsMask::AcquireRelease);10633return spv::NoResult;10634case glslang::EOpSubgroupMemoryBarrierImage:10635builder.createMemoryBarrier(spv::Scope::Subgroup, spv::MemorySemanticsMask::ImageMemory |10636spv::MemorySemanticsMask::AcquireRelease);10637return spv::NoResult;10638case glslang::EOpSubgroupMemoryBarrierShared:10639builder.createMemoryBarrier(spv::Scope::Subgroup, spv::MemorySemanticsMask::WorkgroupMemory |10640spv::MemorySemanticsMask::AcquireRelease);10641return spv::NoResult;1064210643case glslang::EOpEmitVertex:10644builder.createNoResultOp(spv::Op::OpEmitVertex);10645return 0;10646case glslang::EOpEndPrimitive:10647builder.createNoResultOp(spv::Op::OpEndPrimitive);10648return 0;1064910650case glslang::EOpSubgroupElect: {10651std::vector<spv::Id> operands;10652return createSubgroupOperation(op, typeId, operands, glslang::EbtVoid);10653}10654case glslang::EOpTime:10655{10656std::vector<spv::Id> args; // Dummy arguments10657spv::Id id = 
builder.createBuiltinCall(typeId, getExtBuiltins(spv::E_SPV_AMD_gcn_shader), spv::TimeAMD, args);10658return builder.setPrecision(id, precision);10659}10660case glslang::EOpIgnoreIntersectionNV:10661builder.createNoResultOp(spv::Op::OpIgnoreIntersectionNV);10662return 0;10663case glslang::EOpTerminateRayNV:10664builder.createNoResultOp(spv::Op::OpTerminateRayNV);10665return 0;10666case glslang::EOpRayQueryInitialize:10667builder.createNoResultOp(spv::Op::OpRayQueryInitializeKHR);10668return 0;10669case glslang::EOpRayQueryTerminate:10670builder.createNoResultOp(spv::Op::OpRayQueryTerminateKHR);10671return 0;10672case glslang::EOpRayQueryGenerateIntersection:10673builder.createNoResultOp(spv::Op::OpRayQueryGenerateIntersectionKHR);10674return 0;10675case glslang::EOpRayQueryConfirmIntersection:10676builder.createNoResultOp(spv::Op::OpRayQueryConfirmIntersectionKHR);10677return 0;10678case glslang::EOpBeginInvocationInterlock:10679builder.createNoResultOp(spv::Op::OpBeginInvocationInterlockEXT);10680return 0;10681case glslang::EOpEndInvocationInterlock:10682builder.createNoResultOp(spv::Op::OpEndInvocationInterlockEXT);10683return 0;1068410685case glslang::EOpIsHelperInvocation:10686{10687std::vector<spv::Id> args; // Dummy arguments10688builder.addExtension(spv::E_SPV_EXT_demote_to_helper_invocation);10689builder.addCapability(spv::Capability::DemoteToHelperInvocationEXT);10690return builder.createOp(spv::Op::OpIsHelperInvocationEXT, typeId, args);10691}1069210693case glslang::EOpReadClockSubgroupKHR: {10694std::vector<spv::Id> args;10695args.push_back(builder.makeUintConstant(spv::Scope::Subgroup));10696builder.addExtension(spv::E_SPV_KHR_shader_clock);10697builder.addCapability(spv::Capability::ShaderClockKHR);10698return builder.createOp(spv::Op::OpReadClockKHR, typeId, args);10699}1070010701case glslang::EOpReadClockDeviceKHR: {10702std::vector<spv::Id> 
args;10703args.push_back(builder.makeUintConstant(spv::Scope::Device));10704builder.addExtension(spv::E_SPV_KHR_shader_clock);10705builder.addCapability(spv::Capability::ShaderClockKHR);10706return builder.createOp(spv::Op::OpReadClockKHR, typeId, args);10707}10708case glslang::EOpStencilAttachmentReadEXT:10709case glslang::EOpDepthAttachmentReadEXT:10710{10711builder.addExtension(spv::E_SPV_EXT_shader_tile_image);1071210713spv::Decoration precision;10714spv::Op spv_op;10715if (op == glslang::EOpStencilAttachmentReadEXT)10716{10717precision = spv::Decoration::RelaxedPrecision;10718spv_op = spv::Op::OpStencilAttachmentReadEXT;10719builder.addCapability(spv::Capability::TileImageStencilReadAccessEXT);10720}10721else10722{10723precision = spv::NoPrecision;10724spv_op = spv::Op::OpDepthAttachmentReadEXT;10725builder.addCapability(spv::Capability::TileImageDepthReadAccessEXT);10726}1072710728std::vector<spv::Id> args; // Dummy args10729spv::Id result = builder.createOp(spv_op, typeId, args);10730return builder.setPrecision(result, precision);10731}10732default:10733break;10734}1073510736logger->missingFunctionality("unknown operation with no arguments");1073710738return 0;10739}1074010741spv::Id TGlslangToSpvTraverser::getSymbolId(const glslang::TIntermSymbol* symbol)10742{10743auto iter = symbolValues.find(symbol->getId());10744spv::Id id;10745if (symbolValues.end() != iter) {10746id = iter->second;10747return id;10748}1074910750// it was not found, create it10751spv::BuiltIn builtIn = TranslateBuiltInDecoration(symbol->getQualifier().builtIn, false);10752auto forcedType = getForcedType(symbol->getQualifier().builtIn, symbol->getType());1075310754// There are pairs of symbols that map to the same SPIR-V built-in:10755// gl_ObjectToWorldEXT and gl_ObjectToWorld3x4EXT, and gl_WorldToObjectEXT10756// and gl_WorldToObject3x4EXT. 
SPIR-V forbids having two OpVariables10757// with the same BuiltIn in the same storage class, so we must re-use one.10758const bool mayNeedToReuseBuiltIn =10759builtIn == spv::BuiltIn::ObjectToWorldKHR ||10760builtIn == spv::BuiltIn::WorldToObjectKHR;1076110762if (mayNeedToReuseBuiltIn) {10763auto iter = builtInVariableIds.find(uint32_t(builtIn));10764if (builtInVariableIds.end() != iter) {10765id = iter->second;10766symbolValues[symbol->getId()] = id;10767if (forcedType.second != spv::NoType)10768forceType[id] = forcedType.second;10769return id;10770}10771}1077210773if (symbol->getBasicType() == glslang::EbtFunction) {10774return 0;10775}1077610777id = createSpvVariable(symbol, forcedType.first);1077810779if (mayNeedToReuseBuiltIn) {10780builtInVariableIds.insert({uint32_t(builtIn), id});10781}1078210783symbolValues[symbol->getId()] = id;10784if (forcedType.second != spv::NoType)10785forceType[id] = forcedType.second;1078610787if (symbol->getBasicType() != glslang::EbtBlock) {10788builder.addDecoration(id, TranslatePrecisionDecoration(symbol->getType()));10789builder.addDecoration(id, TranslateInterpolationDecoration(symbol->getType().getQualifier()));10790builder.addDecoration(id, TranslateAuxiliaryStorageDecoration(symbol->getType().getQualifier()));10791addMeshNVDecoration(id, /*member*/ -1, symbol->getType().getQualifier());10792if (symbol->getQualifier().hasComponent())10793builder.addDecoration(id, spv::Decoration::Component, symbol->getQualifier().layoutComponent);10794if (symbol->getQualifier().hasIndex())10795builder.addDecoration(id, spv::Decoration::Index, symbol->getQualifier().layoutIndex);10796if (symbol->getType().getQualifier().hasSpecConstantId())10797builder.addDecoration(id, spv::Decoration::SpecId, symbol->getType().getQualifier().layoutSpecConstantId);10798// atomic counters use this:10799if (symbol->getQualifier().hasOffset())10800builder.addDecoration(id, spv::Decoration::Offset, symbol->getQualifier().layoutOffset);10801}1080210803if 
(symbol->getQualifier().hasLocation()) {10804if (!(glslangIntermediate->isRayTracingStage() &&10805(glslangIntermediate->IsRequestedExtension(glslang::E_GL_EXT_ray_tracing) ||10806glslangIntermediate->IsRequestedExtension(glslang::E_GL_NV_shader_invocation_reorder) ||10807glslangIntermediate->IsRequestedExtension(glslang::E_GL_EXT_shader_invocation_reorder))10808&& (builder.getStorageClass(id) == spv::StorageClass::RayPayloadKHR ||10809builder.getStorageClass(id) == spv::StorageClass::IncomingRayPayloadKHR ||10810builder.getStorageClass(id) == spv::StorageClass::CallableDataKHR ||10811builder.getStorageClass(id) == spv::StorageClass::IncomingCallableDataKHR ||10812builder.getStorageClass(id) == spv::StorageClass::HitObjectAttributeEXT ||10813builder.getStorageClass(id) == spv::StorageClass::HitObjectAttributeNV))) {10814// Location values are used to link TraceRayKHR/ExecuteCallableKHR/HitObjectGetAttributesNV10815// to corresponding variables but are not valid in SPIRV since they are supported only10816// for Input/Output Storage classes.10817builder.addDecoration(id, spv::Decoration::Location, symbol->getQualifier().layoutLocation);10818}10819}1082010821builder.addDecoration(id, TranslateInvariantDecoration(symbol->getType().getQualifier()));10822if (symbol->getQualifier().hasStream() && glslangIntermediate->isMultiStream()) {10823builder.addCapability(spv::Capability::GeometryStreams);10824builder.addDecoration(id, spv::Decoration::Stream, symbol->getQualifier().layoutStream);10825}10826if (symbol->getQualifier().hasSet())10827builder.addDecoration(id, spv::Decoration::DescriptorSet, symbol->getQualifier().layoutSet);10828else if (IsDescriptorResource(symbol->getType())) {10829// default to 010830builder.addDecoration(id, spv::Decoration::DescriptorSet, 0);10831}10832if (symbol->getQualifier().hasBinding())10833builder.addDecoration(id, spv::Decoration::Binding, symbol->getQualifier().layoutBinding);10834else if (IsDescriptorResource(symbol->getType())) {10835// 
default to 010836builder.addDecoration(id, spv::Decoration::Binding, 0);10837}10838if (symbol->getQualifier().hasAttachment())10839builder.addDecoration(id, spv::Decoration::InputAttachmentIndex, symbol->getQualifier().layoutAttachment);10840if (glslangIntermediate->getXfbMode()) {10841builder.addCapability(spv::Capability::TransformFeedback);10842if (symbol->getQualifier().hasXfbBuffer()) {10843builder.addDecoration(id, spv::Decoration::XfbBuffer, symbol->getQualifier().layoutXfbBuffer);10844unsigned stride = glslangIntermediate->getXfbStride(symbol->getQualifier().layoutXfbBuffer);10845if (stride != glslang::TQualifier::layoutXfbStrideEnd)10846builder.addDecoration(id, spv::Decoration::XfbStride, stride);10847}10848if (symbol->getQualifier().hasXfbOffset())10849builder.addDecoration(id, spv::Decoration::Offset, symbol->getQualifier().layoutXfbOffset);10850}1085110852// add built-in variable decoration10853if (builtIn != spv::BuiltIn::Max) {10854// WorkgroupSize deprecated in spirv1.610855if (glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_6 ||10856builtIn != spv::BuiltIn::WorkgroupSize)10857builder.addDecoration(id, spv::Decoration::BuiltIn, (int)builtIn);10858}1085910860// Add volatile decoration to HelperInvocation for spirv1.6 and beyond10861if (builtIn == spv::BuiltIn::HelperInvocation &&10862!glslangIntermediate->usingVulkanMemoryModel() &&10863glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6) {10864builder.addDecoration(id, spv::Decoration::Volatile);10865}1086610867// Subgroup builtins which have input storage class are volatile for ray tracing stages.10868if (symbol->getType().isImage() || symbol->getQualifier().isPipeInput()) {10869std::vector<spv::Decoration> memory;10870TranslateMemoryDecoration(symbol->getType().getQualifier(), memory,10871glslangIntermediate->usingVulkanMemoryModel());10872for (unsigned int i = 0; i < memory.size(); ++i)10873builder.addDecoration(id, memory[i]);10874}1087510876if (builtIn == 
spv::BuiltIn::SampleMask) {10877spv::Decoration decoration;10878// GL_NV_sample_mask_override_coverage extension10879if (glslangIntermediate->getLayoutOverrideCoverage())10880decoration = spv::Decoration::OverrideCoverageNV;10881else10882decoration = spv::Decoration::Max;10883builder.addDecoration(id, decoration);10884if (decoration != spv::Decoration::Max) {10885builder.addCapability(spv::Capability::SampleMaskOverrideCoverageNV);10886builder.addExtension(spv::E_SPV_NV_sample_mask_override_coverage);10887}10888}10889else if (builtIn == spv::BuiltIn::Layer) {10890// SPV_NV_viewport_array2 extension10891if (symbol->getQualifier().layoutViewportRelative) {10892builder.addDecoration(id, spv::Decoration::ViewportRelativeNV);10893builder.addCapability(spv::Capability::ShaderViewportMaskNV);10894builder.addExtension(spv::E_SPV_NV_viewport_array2);10895}10896if (symbol->getQualifier().layoutSecondaryViewportRelativeOffset != -2048) {10897builder.addDecoration(id, spv::Decoration::SecondaryViewportRelativeNV,10898symbol->getQualifier().layoutSecondaryViewportRelativeOffset);10899builder.addCapability(spv::Capability::ShaderStereoViewNV);10900builder.addExtension(spv::E_SPV_NV_stereo_view_rendering);10901}10902}1090310904if (symbol->getQualifier().layoutPassthrough) {10905builder.addDecoration(id, spv::Decoration::PassthroughNV);10906builder.addCapability(spv::Capability::GeometryShaderPassthroughNV);10907builder.addExtension(spv::E_SPV_NV_geometry_shader_passthrough);10908}10909if (symbol->getQualifier().pervertexNV) {10910builder.addDecoration(id, spv::Decoration::PerVertexNV);10911builder.addCapability(spv::Capability::FragmentBarycentricNV);10912builder.addExtension(spv::E_SPV_NV_fragment_shader_barycentric);10913}1091410915if (symbol->getQualifier().pervertexEXT) {10916builder.addDecoration(id, 
spv::Decoration::PerVertexKHR);10917builder.addCapability(spv::Capability::FragmentBarycentricKHR);10918builder.addExtension(spv::E_SPV_KHR_fragment_shader_barycentric);10919}1092010921if (glslangIntermediate->getHlslFunctionality1() && symbol->getType().getQualifier().semanticName != nullptr) {10922builder.addExtension("SPV_GOOGLE_hlsl_functionality1");10923builder.addDecoration(id, spv::Decoration::HlslSemanticGOOGLE,10924symbol->getType().getQualifier().semanticName);10925}1092610927if (symbol->isReference()) {10928builder.addDecoration(id, symbol->getType().getQualifier().restrict ?10929spv::Decoration::RestrictPointerEXT : spv::Decoration::AliasedPointerEXT);10930}1093110932// Add SPIR-V decorations (GL_EXT_spirv_intrinsics)10933if (symbol->getType().getQualifier().hasSpirvDecorate())10934applySpirvDecorate(symbol->getType(), id, {});1093510936return id;10937}1093810939// add per-primitive, per-view. per-task decorations to a struct member (member >= 0) or an object10940void TGlslangToSpvTraverser::addMeshNVDecoration(spv::Id id, int member, const glslang::TQualifier& qualifier)10941{10942bool isMeshShaderExt = (glslangIntermediate->getRequestedExtensions().find(glslang::E_GL_EXT_mesh_shader) !=10943glslangIntermediate->getRequestedExtensions().end());1094410945if (member >= 0) {10946if (qualifier.perPrimitiveNV) {10947// Need to add capability/extension for fragment shader.10948// Mesh shader already adds this by default.10949if (glslangIntermediate->getStage() == EShLangFragment) {10950if(isMeshShaderExt) {10951builder.addCapability(spv::Capability::MeshShadingEXT);10952builder.addExtension(spv::E_SPV_EXT_mesh_shader);10953} else {10954builder.addCapability(spv::Capability::MeshShadingNV);10955builder.addExtension(spv::E_SPV_NV_mesh_shader);10956}10957}10958builder.addMemberDecoration(id, (unsigned)member, spv::Decoration::PerPrimitiveNV);10959}10960if (qualifier.perViewNV)10961builder.addMemberDecoration(id, (unsigned)member, 
spv::Decoration::PerViewNV);10962if (qualifier.perTaskNV)10963builder.addMemberDecoration(id, (unsigned)member, spv::Decoration::PerTaskNV);10964} else {10965if (qualifier.perPrimitiveNV) {10966// Need to add capability/extension for fragment shader.10967// Mesh shader already adds this by default.10968if (glslangIntermediate->getStage() == EShLangFragment) {10969if(isMeshShaderExt) {10970builder.addCapability(spv::Capability::MeshShadingEXT);10971builder.addExtension(spv::E_SPV_EXT_mesh_shader);10972} else {10973builder.addCapability(spv::Capability::MeshShadingNV);10974builder.addExtension(spv::E_SPV_NV_mesh_shader);10975}10976}10977builder.addDecoration(id, spv::Decoration::PerPrimitiveNV);10978}10979if (qualifier.perViewNV)10980builder.addDecoration(id, spv::Decoration::PerViewNV);10981if (qualifier.perTaskNV)10982builder.addDecoration(id, spv::Decoration::PerTaskNV);10983}10984}1098510986bool TGlslangToSpvTraverser::hasQCOMImageProceessingDecoration(spv::Id id, spv::Decoration decor)10987{10988std::vector<spv::Decoration> &decoVec = idToQCOMDecorations[id];10989for ( auto d : decoVec ) {10990if ( d == decor )10991return true;10992}10993return false;10994}1099510996void TGlslangToSpvTraverser::addImageProcessingQCOMDecoration(spv::Id id, spv::Decoration decor)10997{10998spv::Op opc = builder.getOpCode(id);10999if (opc == spv::Op::OpSampledImage) {11000id = builder.getIdOperand(id, 0);11001opc = builder.getOpCode(id);11002}1100311004if (opc == spv::Op::OpLoad) {11005spv::Id texid = builder.getIdOperand(id, 0);11006if (!hasQCOMImageProceessingDecoration(texid, decor)) {//11007builder.addDecoration(texid, decor);11008idToQCOMDecorations[texid].push_back(decor);11009}11010}11011}1101211013void TGlslangToSpvTraverser::addImageProcessing2QCOMDecoration(spv::Id id, bool isForGather)11014{11015if (isForGather) {11016return addImageProcessingQCOMDecoration(id, spv::Decoration::BlockMatchTextureQCOM);11017}1101811019auto addDecor =11020[this](spv::Id id, spv::Decoration 
decor) {11021spv::Op tsopc = this->builder.getOpCode(id);11022if (tsopc == spv::Op::OpLoad) {11023spv::Id tsid = this->builder.getIdOperand(id, 0);11024if (this->glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4) {11025assert(iOSet.count(tsid) > 0);11026}11027if (!hasQCOMImageProceessingDecoration(tsid, decor)) {11028this->builder.addDecoration(tsid, decor);11029idToQCOMDecorations[tsid].push_back(decor);11030}11031}11032};1103311034spv::Op opc = builder.getOpCode(id);11035bool isInterfaceObject = (opc != spv::Op::OpSampledImage);1103611037if (!isInterfaceObject) {11038addDecor(builder.getIdOperand(id, 0), spv::Decoration::BlockMatchTextureQCOM);11039addDecor(builder.getIdOperand(id, 1), spv::Decoration::BlockMatchSamplerQCOM);11040} else {11041addDecor(id, spv::Decoration::BlockMatchTextureQCOM);11042addDecor(id, spv::Decoration::BlockMatchSamplerQCOM);11043}11044}1104511046// Make a full tree of instructions to build a SPIR-V specialization constant,11047// or regular constant if possible.11048//11049// TBD: this is not yet done, nor verified to be the best design, it does do the leaf symbols though11050//11051// Recursively walk the nodes. The nodes form a tree whose leaves are11052// regular constants, which themselves are trees that createSpvConstant()11053// recursively walks. So, this function walks the "top" of the tree:11054// - emit specialization constant-building instructions for specConstant11055// - when running into a non-spec-constant, switch to createSpvConstant()11056spv::Id TGlslangToSpvTraverser::createSpvConstant(const glslang::TIntermTyped& node)11057{11058assert(node.getQualifier().isConstant());1105911060// Handle front-end constants first (non-specialization constants).11061if (! 
node.getQualifier().specConstant) {11062// hand off to the non-spec-constant path11063assert(node.getAsConstantUnion() != nullptr || node.getAsSymbolNode() != nullptr);11064int nextConst = 0;11065return createSpvConstantFromConstUnionArray(node.getType(), node.getAsConstantUnion() ?11066node.getAsConstantUnion()->getConstArray() : node.getAsSymbolNode()->getConstArray(),11067nextConst, false);11068}1106911070// We now know we have a specialization constant to build1107111072// Extra capabilities may be needed.11073if (node.getType().contains8BitInt())11074builder.addCapability(spv::Capability::Int8);11075if (node.getType().contains16BitFloat())11076builder.addCapability(spv::Capability::Float16);11077if (node.getType().contains16BitInt())11078builder.addCapability(spv::Capability::Int16);11079if (node.getType().contains64BitInt())11080builder.addCapability(spv::Capability::Int64);11081if (node.getType().containsDouble())11082builder.addCapability(spv::Capability::Float64);1108311084// gl_WorkGroupSize is a special case until the front-end handles hierarchical specialization constants,11085// even then, it's specialization ids are handled by special case syntax in GLSL: layout(local_size_x = ...11086if (node.getType().getQualifier().builtIn == glslang::EbvWorkGroupSize) {11087std::vector<spv::Id> dimConstId;11088for (int dim = 0; dim < 3; ++dim) {11089bool specConst = (glslangIntermediate->getLocalSizeSpecId(dim) != glslang::TQualifier::layoutNotSet);11090dimConstId.push_back(builder.makeUintConstant(glslangIntermediate->getLocalSize(dim), specConst));11091if (specConst) {11092builder.addDecoration(dimConstId.back(), spv::Decoration::SpecId,11093glslangIntermediate->getLocalSizeSpecId(dim));11094}11095}11096return builder.makeCompositeConstant(builder.makeVectorType(builder.makeUintType(32), 3), dimConstId, true);11097}1109811099// An AST node labelled as specialization constant should be a symbol node.11100// Its initializer should either be a sub tree with 
constant nodes, or a constant union array.11101if (auto* sn = node.getAsSymbolNode()) {11102spv::Id result;11103if (auto* sub_tree = sn->getConstSubtree()) {11104// Traverse the constant constructor sub tree like generating normal run-time instructions.11105// During the AST traversal, if the node is marked as 'specConstant', SpecConstantOpModeGuard11106// will set the builder into spec constant op instruction generating mode.11107sub_tree->traverse(this);11108result = accessChainLoad(sub_tree->getType());11109} else if (auto* const_union_array = &sn->getConstArray()) {11110int nextConst = 0;11111result = createSpvConstantFromConstUnionArray(sn->getType(), *const_union_array, nextConst, true);11112} else {11113logger->missingFunctionality("Invalid initializer for spec constant.");11114return spv::NoResult;11115}11116builder.addName(result, sn->getName().c_str());11117return result;11118}1111911120// Neither a front-end constant node, nor a specialization constant node with constant union array or11121// constant sub tree as initializer.11122logger->missingFunctionality("Neither a front-end constant nor a spec constant.");11123return spv::NoResult;11124}1112511126// Use 'consts' as the flattened glslang source of scalar constants to recursively11127// build the aggregate SPIR-V constant.11128//11129// If there are not enough elements present in 'consts', 0 will be substituted;11130// an empty 'consts' can be used to create a fully zeroed SPIR-V constant.11131//11132spv::Id TGlslangToSpvTraverser::createSpvConstantFromConstUnionArray(const glslang::TType& glslangType,11133const glslang::TConstUnionArray& consts, int& nextConst, bool specConstant)11134{11135// vector of constants for SPIR-V11136std::vector<spv::Id> spvConsts;1113711138// Type is used for struct and array constants11139spv::Id typeId = convertGlslangToSpvType(glslangType);1114011141if (glslangType.isArray()) {11142glslang::TType elementType(glslangType, 0);11143for (int i = 0; i < 
glslangType.getOuterArraySize(); ++i)11144spvConsts.push_back(createSpvConstantFromConstUnionArray(elementType, consts, nextConst, false));11145} else if (glslangType.isMatrix()) {11146glslang::TType vectorType(glslangType, 0);11147for (int col = 0; col < glslangType.getMatrixCols(); ++col)11148spvConsts.push_back(createSpvConstantFromConstUnionArray(vectorType, consts, nextConst, false));11149} else if (glslangType.isCoopMat()) {11150glslang::TType componentType(glslangType.getBasicType());11151spvConsts.push_back(createSpvConstantFromConstUnionArray(componentType, consts, nextConst, false));11152} else if (glslangType.isStruct()) {11153glslang::TVector<glslang::TTypeLoc>::const_iterator iter;11154for (iter = glslangType.getStruct()->begin(); iter != glslangType.getStruct()->end(); ++iter)11155spvConsts.push_back(createSpvConstantFromConstUnionArray(*iter->type, consts, nextConst, false));11156} else if (glslangType.getVectorSize() > 1 || glslangType.isCoopVecNV()) {11157unsigned int numComponents = glslangType.isCoopVecNV() ? glslangType.getTypeParameters()->arraySizes->getDimSize(0) : glslangType.getVectorSize();11158for (unsigned int i = 0; i < numComponents; ++i) {11159bool zero = nextConst >= consts.size();11160switch (glslangType.getBasicType()) {11161case glslang::EbtInt:11162spvConsts.push_back(builder.makeIntConstant(zero ? 0 : consts[nextConst].getIConst()));11163break;11164case glslang::EbtUint:11165spvConsts.push_back(builder.makeUintConstant(zero ? 0 : consts[nextConst].getUConst()));11166break;11167case glslang::EbtFloat:11168spvConsts.push_back(builder.makeFloatConstant(zero ? 0.0F : (float)consts[nextConst].getDConst()));11169break;11170case glslang::EbtBool:11171spvConsts.push_back(builder.makeBoolConstant(zero ? false : consts[nextConst].getBConst()));11172break;11173case glslang::EbtInt8:11174builder.addCapability(spv::Capability::Int8);11175spvConsts.push_back(builder.makeInt8Constant(zero ? 
0 : consts[nextConst].getI8Const()));11176break;11177case glslang::EbtUint8:11178builder.addCapability(spv::Capability::Int8);11179spvConsts.push_back(builder.makeUint8Constant(zero ? 0 : consts[nextConst].getU8Const()));11180break;11181case glslang::EbtInt16:11182builder.addCapability(spv::Capability::Int16);11183spvConsts.push_back(builder.makeInt16Constant(zero ? 0 : consts[nextConst].getI16Const()));11184break;11185case glslang::EbtUint16:11186builder.addCapability(spv::Capability::Int16);11187spvConsts.push_back(builder.makeUint16Constant(zero ? 0 : consts[nextConst].getU16Const()));11188break;11189case glslang::EbtInt64:11190spvConsts.push_back(builder.makeInt64Constant(zero ? 0 : consts[nextConst].getI64Const()));11191break;11192case glslang::EbtUint64:11193spvConsts.push_back(builder.makeUint64Constant(zero ? 0 : consts[nextConst].getU64Const()));11194break;11195case glslang::EbtDouble:11196spvConsts.push_back(builder.makeDoubleConstant(zero ? 0.0 : consts[nextConst].getDConst()));11197break;11198case glslang::EbtFloat16:11199builder.addCapability(spv::Capability::Float16);11200spvConsts.push_back(builder.makeFloat16Constant(zero ? 0.0F : (float)consts[nextConst].getDConst()));11201break;11202case glslang::EbtBFloat16:11203spvConsts.push_back(builder.makeBFloat16Constant(zero ? 0.0F : (float)consts[nextConst].getDConst()));11204break;11205case glslang::EbtFloatE5M2:11206spvConsts.push_back(builder.makeFloatE5M2Constant(zero ? 0.0F : (float)consts[nextConst].getDConst()));11207break;11208case glslang::EbtFloatE4M3:11209spvConsts.push_back(builder.makeFloatE4M3Constant(zero ? 0.0F : (float)consts[nextConst].getDConst()));11210break;11211default:11212assert(0);11213break;11214}11215++nextConst;11216}11217} else {11218// we have a non-aggregate (scalar) constant11219bool zero = nextConst >= consts.size();11220spv::Id scalar = 0;11221switch (glslangType.getBasicType()) {11222case glslang::EbtInt:11223scalar = builder.makeIntConstant(zero ? 
0 : consts[nextConst].getIConst(), specConstant);11224break;11225case glslang::EbtUint:11226scalar = builder.makeUintConstant(zero ? 0 : consts[nextConst].getUConst(), specConstant);11227break;11228case glslang::EbtFloat:11229scalar = builder.makeFloatConstant(zero ? 0.0F : (float)consts[nextConst].getDConst(), specConstant);11230break;11231case glslang::EbtBool:11232scalar = builder.makeBoolConstant(zero ? false : consts[nextConst].getBConst(), specConstant);11233break;11234case glslang::EbtInt8:11235builder.addCapability(spv::Capability::Int8);11236scalar = builder.makeInt8Constant(zero ? 0 : consts[nextConst].getI8Const(), specConstant);11237break;11238case glslang::EbtUint8:11239builder.addCapability(spv::Capability::Int8);11240scalar = builder.makeUint8Constant(zero ? 0 : consts[nextConst].getU8Const(), specConstant);11241break;11242case glslang::EbtInt16:11243builder.addCapability(spv::Capability::Int16);11244scalar = builder.makeInt16Constant(zero ? 0 : consts[nextConst].getI16Const(), specConstant);11245break;11246case glslang::EbtUint16:11247builder.addCapability(spv::Capability::Int16);11248scalar = builder.makeUint16Constant(zero ? 0 : consts[nextConst].getU16Const(), specConstant);11249break;11250case glslang::EbtInt64:11251scalar = builder.makeInt64Constant(zero ? 0 : consts[nextConst].getI64Const(), specConstant);11252break;11253case glslang::EbtUint64:11254scalar = builder.makeUint64Constant(zero ? 0 : consts[nextConst].getU64Const(), specConstant);11255break;11256case glslang::EbtDouble:11257scalar = builder.makeDoubleConstant(zero ? 0.0 : consts[nextConst].getDConst(), specConstant);11258break;11259case glslang::EbtFloat16:11260builder.addCapability(spv::Capability::Float16);11261scalar = builder.makeFloat16Constant(zero ? 0.0F : (float)consts[nextConst].getDConst(), specConstant);11262break;11263case glslang::EbtBFloat16:11264scalar = builder.makeBFloat16Constant(zero ? 
0.0F : (float)consts[nextConst].getDConst(), specConstant);11265break;11266case glslang::EbtFloatE5M2:11267scalar = builder.makeFloatE5M2Constant(zero ? 0.0F : (float)consts[nextConst].getDConst(), specConstant);11268break;11269case glslang::EbtFloatE4M3:11270scalar = builder.makeFloatE4M3Constant(zero ? 0.0F : (float)consts[nextConst].getDConst(), specConstant);11271break;11272case glslang::EbtReference:11273scalar = builder.makeUint64Constant(zero ? 0 : consts[nextConst].getU64Const(), specConstant);11274scalar = builder.createUnaryOp(spv::Op::OpBitcast, typeId, scalar);11275break;11276case glslang::EbtString:11277scalar = builder.getStringId(consts[nextConst].getSConst()->c_str());11278break;11279default:11280assert(0);11281break;11282}11283++nextConst;11284return scalar;11285}1128611287return builder.makeCompositeConstant(typeId, spvConsts);11288}1128911290// Return true if the node is a constant or symbol whose reading has no11291// non-trivial observable cost or effect.11292bool TGlslangToSpvTraverser::isTrivialLeaf(const glslang::TIntermTyped* node)11293{11294// don't know what this is11295if (node == nullptr)11296return false;1129711298// a constant is safe11299if (node->getAsConstantUnion() != nullptr)11300return true;1130111302// not a symbol means non-trivial11303if (node->getAsSymbolNode() == nullptr)11304return false;1130511306// a symbol, depends on what's being read11307switch (node->getType().getQualifier().storage) {11308case glslang::EvqTemporary:11309case glslang::EvqGlobal:11310case glslang::EvqIn:11311case glslang::EvqInOut:11312case glslang::EvqConst:11313case glslang::EvqConstReadOnly:11314case glslang::EvqUniform:11315return true;11316default:11317return false;11318}11319}1132011321// A node is trivial if it is a single operation with no side effects.11322// HLSL (and/or vectors) are always trivial, as it does not short circuit.11323// Otherwise, error on the side of saying non-trivial.11324// Return true if trivial.11325bool 
TGlslangToSpvTraverser::isTrivial(const glslang::TIntermTyped* node)11326{11327if (node == nullptr)11328return false;1132911330// count non scalars as trivial, as well as anything coming from HLSL11331if (! node->getType().isScalarOrVec1() || glslangIntermediate->getSource() == glslang::EShSourceHlsl)11332return true;1133311334// symbols and constants are trivial11335if (isTrivialLeaf(node))11336return true;1133711338// otherwise, it needs to be a simple operation or one or two leaf nodes1133911340// not a simple operation11341const glslang::TIntermBinary* binaryNode = node->getAsBinaryNode();11342const glslang::TIntermUnary* unaryNode = node->getAsUnaryNode();11343if (binaryNode == nullptr && unaryNode == nullptr)11344return false;1134511346// not on leaf nodes11347if (binaryNode && (! isTrivialLeaf(binaryNode->getLeft()) || ! isTrivialLeaf(binaryNode->getRight())))11348return false;1134911350if (unaryNode && ! isTrivialLeaf(unaryNode->getOperand())) {11351return false;11352}1135311354if (IsOpNumericConv(node->getAsOperator()->getOp()) &&11355node->getType().getBasicType() == glslang::EbtBool) {11356return true;11357}1135811359switch (node->getAsOperator()->getOp()) {11360case glslang::EOpLogicalNot:11361case glslang::EOpEqual:11362case glslang::EOpNotEqual:11363case glslang::EOpLessThan:11364case glslang::EOpGreaterThan:11365case glslang::EOpLessThanEqual:11366case glslang::EOpGreaterThanEqual:11367case glslang::EOpIndexDirect:11368case glslang::EOpIndexDirectStruct:11369case glslang::EOpLogicalXor:11370case glslang::EOpAny:11371case glslang::EOpAll:11372return true;11373default:11374return false;11375}11376}1137711378// Emit short-circuiting code, where 'right' is never evaluated unless11379// the left side is true (for &&) or false (for ||).11380spv::Id TGlslangToSpvTraverser::createShortCircuit(glslang::TOperator op, glslang::TIntermTyped& left,11381glslang::TIntermTyped& right)11382{11383spv::Id boolTypeId = builder.makeBoolType();1138411385// emit left 
operand11386builder.clearAccessChain();11387left.traverse(this);11388spv::Id leftId = accessChainLoad(left.getType());1138911390// Operands to accumulate OpPhi operands11391std::vector<spv::Id> phiOperands;11392phiOperands.reserve(4);11393// accumulate left operand's phi information11394phiOperands.push_back(leftId);11395phiOperands.push_back(builder.getBuildPoint()->getId());1139611397// Make the two kinds of operation symmetric with a "!"11398// || => emit "if (! left) result = right"11399// && => emit "if ( left) result = right"11400//11401// TODO: this runtime "not" for || could be avoided by adding functionality11402// to 'builder' to have an "else" without an "then"11403if (op == glslang::EOpLogicalOr)11404leftId = builder.createUnaryOp(spv::Op::OpLogicalNot, boolTypeId, leftId);1140511406// make an "if" based on the left value11407spv::Builder::If ifBuilder(leftId, spv::SelectionControlMask::MaskNone, builder);1140811409// emit right operand as the "then" part of the "if"11410builder.clearAccessChain();11411right.traverse(this);11412spv::Id rightId = accessChainLoad(right.getType());1141311414// accumulate left operand's phi information11415phiOperands.push_back(rightId);11416phiOperands.push_back(builder.getBuildPoint()->getId());1141711418// finish the "if"11419ifBuilder.makeEndIf();1142011421// phi together the two results11422return builder.createOp(spv::Op::OpPhi, boolTypeId, phiOperands);11423}1142411425// Return type Id of the imported set of extended instructions corresponds to the name.11426// Import this set if it has not been imported yet.11427spv::Id TGlslangToSpvTraverser::getExtBuiltins(const char* name)11428{11429if (extBuiltinMap.find(name) != extBuiltinMap.end())11430return extBuiltinMap[name];11431else {11432spv::Id extBuiltins = builder.import(name);11433extBuiltinMap[name] = extBuiltins;11434return extBuiltins;11435}11436}1143711438} // end anonymous namespace1143911440namespace glslang {1144111442void GetSpirvVersion(std::string& 
version)11443{11444const int bufSize = 100;11445char buf[bufSize];11446snprintf(buf, bufSize, "0x%08x, Revision %d", spv::Version, spv::Revision);11447version = buf;11448}1144911450// For low-order part of the generator's magic number. Bump up11451// when there is a change in the style (e.g., if SSA form changes,11452// or a different instruction sequence to do something gets used).11453int GetSpirvGeneratorVersion()11454{11455// return 1; // start11456// return 2; // EOpAtomicCounterDecrement gets a post decrement, to map between GLSL -> SPIR-V11457// return 3; // change/correct barrier-instruction operands, to match memory model group decisions11458// return 4; // some deeper access chains: for dynamic vector component, and local Boolean component11459// return 5; // make OpArrayLength result type be an int with signedness of 011460// return 6; // revert version 5 change, which makes a different (new) kind of incorrect code,11461// versions 4 and 6 each generate OpArrayLength as it has long been done11462// return 7; // GLSL volatile keyword maps to both SPIR-V decorations Volatile and Coherent11463// return 8; // switch to new dead block eliminator; use OpUnreachable11464// return 9; // don't include opaque function parameters in OpEntryPoint global's operand list11465// return 10; // Generate OpFUnordNotEqual for != comparisons11466return 11; // Make OpEmitMeshTasksEXT a terminal instruction11467}1146811469// Write SPIR-V out to a binary file11470bool OutputSpvBin(const std::vector<unsigned int>& spirv, const char* baseName)11471{11472std::ofstream out;11473out.open(baseName, std::ios::binary | std::ios::out);11474if (out.fail()) {11475printf("ERROR: Failed to open file: %s\n", baseName);11476return false;11477}11478for (int i = 0; i < (int)spirv.size(); ++i) {11479unsigned int word = spirv[i];11480out.write((const char*)&word, 4);11481}11482out.close();11483return true;11484}1148511486// Write SPIR-V out to a text file with 32-bit hexadecimal words11487bool 
OutputSpvHex(const std::vector<unsigned int>& spirv, const char* baseName, const char* varName)11488{11489std::ofstream out;11490out.open(baseName, std::ios::binary | std::ios::out);11491if (out.fail()) {11492printf("ERROR: Failed to open file: %s\n", baseName);11493return false;11494}11495out << "\t// " <<11496GetSpirvGeneratorVersion() <<11497GLSLANG_VERSION_MAJOR << "." << GLSLANG_VERSION_MINOR << "." << GLSLANG_VERSION_PATCH <<11498GLSLANG_VERSION_FLAVOR << std::endl;11499if (varName != nullptr) {11500out << "\t #pragma once" << std::endl;11501out << "const uint32_t " << varName << "[] = {" << std::endl;11502}11503const int WORDS_PER_LINE = 8;11504for (int i = 0; i < (int)spirv.size(); i += WORDS_PER_LINE) {11505out << "\t";11506for (int j = 0; j < WORDS_PER_LINE && i + j < (int)spirv.size(); ++j) {11507const unsigned int word = spirv[i + j];11508out << "0x" << std::hex << std::setw(8) << std::setfill('0') << word;11509if (i + j + 1 < (int)spirv.size()) {11510out << ",";11511}11512}11513out << std::endl;11514}11515if (varName != nullptr) {11516out << "};";11517out << std::endl;11518}11519out.close();11520return true;11521}1152211523//11524// Set up the glslang traversal11525//11526void GlslangToSpv(const TIntermediate& intermediate, std::vector<unsigned int>& spirv, SpvOptions* options)11527{11528spv::SpvBuildLogger logger;11529GlslangToSpv(intermediate, spirv, &logger, options);11530}1153111532void GlslangToSpv(const TIntermediate& intermediate, std::vector<unsigned int>& spirv,11533spv::SpvBuildLogger* logger, SpvOptions* options)11534{11535TIntermNode* root = intermediate.getTreeRoot();1153611537if (root == nullptr)11538return;1153911540SpvOptions defaultOptions;11541if (options == nullptr)11542options = &defaultOptions;1154311544GetThreadPoolAllocator().push();1154511546TGlslangToSpvTraverser it(intermediate.getSpv().spv, &intermediate, logger, *options);11547root->traverse(&it);11548it.finishSpv(options->compileOnly);11549it.dumpSpv(spirv);1155011551#if 
ENABLE_OPT11552// If from HLSL, run spirv-opt to "legalize" the SPIR-V for Vulkan11553// eg. forward and remove memory writes of opaque types.11554bool prelegalization = intermediate.getSource() == EShSourceHlsl;11555if ((prelegalization || options->optimizeSize) && !options->disableOptimizer) {11556SpirvToolsTransform(intermediate, spirv, logger, options);11557prelegalization = false;11558}11559else if (options->stripDebugInfo) {11560// Strip debug info even if optimization is disabled.11561SpirvToolsStripDebugInfo(intermediate, spirv, logger);11562}1156311564if (options->validate)11565SpirvToolsValidate(intermediate, spirv, logger, prelegalization);1156611567if (options->disassemble)11568SpirvToolsDisassemble(std::cout, spirv);1156911570#endif1157111572GetThreadPoolAllocator().pop();11573}1157411575} // end namespace glslang115761157711578