Book a Demo!
CoCalc Logo Icon
StoreFeaturesDocsShareSupportNewsAboutPoliciesSign UpSign In
godotengine
GitHub Repository: godotengine/godot
Path: blob/master/thirdparty/glslang/SPIRV/GlslangToSpv.cpp
21917 views
1
//
2
// Copyright (C) 2014-2016 LunarG, Inc.
3
// Copyright (C) 2015-2020 Google, Inc.
4
// Copyright (C) 2017, 2022-2025 Arm Limited.
5
// Modifications Copyright (C) 2020 Advanced Micro Devices, Inc. All rights reserved.
6
//
7
// All rights reserved.
8
//
9
// Redistribution and use in source and binary forms, with or without
10
// modification, are permitted provided that the following conditions
11
// are met:
12
//
13
// Redistributions of source code must retain the above copyright
14
// notice, this list of conditions and the following disclaimer.
15
//
16
// Redistributions in binary form must reproduce the above
17
// copyright notice, this list of conditions and the following
18
// disclaimer in the documentation and/or other materials provided
19
// with the distribution.
20
//
21
// Neither the name of 3Dlabs Inc. Ltd. nor the names of its
22
// contributors may be used to endorse or promote products derived
23
// from this software without specific prior written permission.
24
//
25
// THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
26
// "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
27
// LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS
28
// FOR A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE
29
// COPYRIGHT HOLDERS OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT,
30
// INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING,
31
// BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES;
32
// LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER
33
// CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT
34
// LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN
35
// ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
36
// POSSIBILITY OF SUCH DAMAGE.
37
38
//
39
// Visit the nodes in the glslang intermediate tree representation to
40
// translate them to SPIR-V.
41
//
42
43
#include "spirv.hpp11"
44
#include "GlslangToSpv.h"
45
#include "SpvBuilder.h"
46
#include "SpvTools.h"
47
#include "spvUtil.h"
48
49
namespace spv {
50
#include "GLSL.std.450.h"
51
#include "GLSL.ext.KHR.h"
52
#include "GLSL.ext.EXT.h"
53
#include "GLSL.ext.AMD.h"
54
#include "GLSL.ext.NV.h"
55
#include "GLSL.ext.ARM.h"
56
#include "GLSL.ext.QCOM.h"
57
#include "NonSemanticDebugPrintf.h"
58
}
59
60
// Glslang includes
61
#include "../glslang/MachineIndependent/localintermediate.h"
62
#include "../glslang/MachineIndependent/SymbolTable.h"
63
#include "../glslang/Include/Common.h"
64
65
// Build-time generated includes
66
#include "glslang/build_info.h"
67
68
#include <fstream>
69
#include <iomanip>
70
#include <list>
71
#include <map>
72
#include <optional>
73
#include <stack>
74
#include <string>
75
#include <vector>
76
77
namespace {
78
79
namespace {
80
class SpecConstantOpModeGuard {
81
public:
82
SpecConstantOpModeGuard(spv::Builder* builder)
83
: builder_(builder) {
84
previous_flag_ = builder->isInSpecConstCodeGenMode();
85
}
86
~SpecConstantOpModeGuard() {
87
previous_flag_ ? builder_->setToSpecConstCodeGenMode()
88
: builder_->setToNormalCodeGenMode();
89
}
90
void turnOnSpecConstantOpMode() {
91
builder_->setToSpecConstCodeGenMode();
92
}
93
94
private:
95
spv::Builder* builder_;
96
bool previous_flag_;
97
};
98
99
struct OpDecorations {
100
public:
101
OpDecorations(spv::Decoration precision, spv::Decoration noContraction, spv::Decoration nonUniform) :
102
precision(precision)
103
,
104
noContraction(noContraction),
105
nonUniform(nonUniform)
106
{ }
107
108
spv::Decoration precision;
109
110
void addNoContraction(spv::Builder& builder, spv::Id t) { builder.addDecoration(t, noContraction); }
111
void addNonUniform(spv::Builder& builder, spv::Id t) { builder.addDecoration(t, nonUniform); }
112
protected:
113
spv::Decoration noContraction;
114
spv::Decoration nonUniform;
115
};
116
117
} // namespace
118
119
//
120
// The main holder of information for translating glslang to SPIR-V.
121
//
122
// Derives from the AST walking base class.
123
//
124
class TGlslangToSpvTraverser : public glslang::TIntermTraverser {
125
public:
126
TGlslangToSpvTraverser(unsigned int spvVersion, const glslang::TIntermediate*, spv::SpvBuildLogger* logger,
127
glslang::SpvOptions& options);
128
virtual ~TGlslangToSpvTraverser() { }
129
130
bool visitAggregate(glslang::TVisit, glslang::TIntermAggregate*) override;
131
bool visitBinary(glslang::TVisit, glslang::TIntermBinary*) override;
132
void visitConstantUnion(glslang::TIntermConstantUnion*) override;
133
bool visitSelection(glslang::TVisit, glslang::TIntermSelection*) override;
134
bool visitSwitch(glslang::TVisit, glslang::TIntermSwitch*) override;
135
void visitSymbol(glslang::TIntermSymbol* symbol) override;
136
bool visitUnary(glslang::TVisit, glslang::TIntermUnary*) override;
137
bool visitLoop(glslang::TVisit, glslang::TIntermLoop*) override;
138
bool visitBranch(glslang::TVisit visit, glslang::TIntermBranch*) override;
139
bool visitVariableDecl(glslang::TVisit, glslang::TIntermVariableDecl*) override;
140
141
void finishSpv(bool compileOnly);
142
void dumpSpv(std::vector<unsigned int>& out);
143
144
protected:
145
TGlslangToSpvTraverser(TGlslangToSpvTraverser&);
146
TGlslangToSpvTraverser& operator=(TGlslangToSpvTraverser&);
147
148
spv::Decoration TranslateInterpolationDecoration(const glslang::TQualifier& qualifier);
149
spv::Decoration TranslateAuxiliaryStorageDecoration(const glslang::TQualifier& qualifier);
150
spv::Decoration TranslateNonUniformDecoration(const glslang::TQualifier& qualifier);
151
spv::Decoration TranslateNonUniformDecoration(const spv::Builder::AccessChain::CoherentFlags& coherentFlags);
152
spv::Builder::AccessChain::CoherentFlags TranslateCoherent(const glslang::TType& type);
153
spv::MemoryAccessMask TranslateMemoryAccess(const spv::Builder::AccessChain::CoherentFlags &coherentFlags);
154
spv::ImageOperandsMask TranslateImageOperands(const spv::Builder::AccessChain::CoherentFlags &coherentFlags);
155
spv::Scope TranslateMemoryScope(const spv::Builder::AccessChain::CoherentFlags &coherentFlags);
156
spv::BuiltIn TranslateBuiltInDecoration(glslang::TBuiltInVariable, bool memberDeclaration);
157
spv::ImageFormat TranslateImageFormat(const glslang::TType& type);
158
spv::SelectionControlMask TranslateSelectionControl(const glslang::TIntermSelection&) const;
159
spv::SelectionControlMask TranslateSwitchControl(const glslang::TIntermSwitch&) const;
160
spv::LoopControlMask TranslateLoopControl(const glslang::TIntermLoop&, std::vector<unsigned int>& operands) const;
161
spv::StorageClass TranslateStorageClass(const glslang::TType&);
162
void TranslateLiterals(const glslang::TVector<const glslang::TIntermConstantUnion*>&, std::vector<unsigned>&) const;
163
void addIndirectionIndexCapabilities(const glslang::TType& baseType, const glslang::TType& indexType);
164
spv::Id createSpvVariable(const glslang::TIntermSymbol*, spv::Id forcedType);
165
spv::Id getSampledType(const glslang::TSampler&);
166
spv::Id getInvertedSwizzleType(const glslang::TIntermTyped&);
167
spv::Id createInvertedSwizzle(spv::Decoration precision, const glslang::TIntermTyped&, spv::Id parentResult);
168
void convertSwizzle(const glslang::TIntermAggregate&, std::vector<unsigned>& swizzle);
169
spv::Id convertGlslangToSpvType(const glslang::TType& type, bool forwardReferenceOnly = false);
170
spv::Id convertGlslangToSpvType(const glslang::TType& type, glslang::TLayoutPacking, const glslang::TQualifier&,
171
bool lastBufferBlockMember, bool forwardReferenceOnly = false);
172
void applySpirvDecorate(const glslang::TType& type, spv::Id id, std::optional<int> member);
173
bool filterMember(const glslang::TType& member);
174
spv::Id convertGlslangStructToSpvType(const glslang::TType&, const glslang::TTypeList* glslangStruct,
175
glslang::TLayoutPacking, const glslang::TQualifier&);
176
spv::LinkageType convertGlslangLinkageToSpv(glslang::TLinkType glslangLinkType);
177
void decorateStructType(const glslang::TType&, const glslang::TTypeList* glslangStruct, glslang::TLayoutPacking,
178
const glslang::TQualifier&, spv::Id, const std::vector<spv::Id>& spvMembers);
179
spv::Id makeArraySizeId(const glslang::TArraySizes&, int dim, bool allowZero = false, bool boolType = false);
180
spv::Id accessChainLoad(const glslang::TType& type);
181
void accessChainStore(const glslang::TType& type, spv::Id rvalue);
182
void multiTypeStore(const glslang::TType&, spv::Id rValue);
183
spv::Id convertLoadedBoolInUniformToUint(const glslang::TType& type, spv::Id nominalTypeId, spv::Id loadedId);
184
glslang::TLayoutPacking getExplicitLayout(const glslang::TType& type) const;
185
int getArrayStride(const glslang::TType& arrayType, glslang::TLayoutPacking, glslang::TLayoutMatrix);
186
int getMatrixStride(const glslang::TType& matrixType, glslang::TLayoutPacking, glslang::TLayoutMatrix);
187
void updateMemberOffset(const glslang::TType& structType, const glslang::TType& memberType, int& currentOffset,
188
int& nextOffset, glslang::TLayoutPacking, glslang::TLayoutMatrix);
189
void declareUseOfStructMember(const glslang::TTypeList& members, int glslangMember);
190
191
bool isShaderEntryPoint(const glslang::TIntermAggregate* node);
192
bool writableParam(glslang::TStorageQualifier) const;
193
bool originalParam(glslang::TStorageQualifier, const glslang::TType&, bool implicitThisParam);
194
void makeFunctions(const glslang::TIntermSequence&);
195
void makeGlobalInitializers(const glslang::TIntermSequence&);
196
void collectRayTracingLinkerObjects();
197
void visitFunctions(const glslang::TIntermSequence&);
198
void translateArguments(const glslang::TIntermAggregate& node, std::vector<spv::Id>& arguments,
199
spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags);
200
void translateArguments(glslang::TIntermUnary& node, std::vector<spv::Id>& arguments);
201
spv::Id createImageTextureFunctionCall(glslang::TIntermOperator* node);
202
spv::Id handleUserFunctionCall(const glslang::TIntermAggregate*);
203
204
spv::Id createBinaryOperation(glslang::TOperator op, OpDecorations&, spv::Id typeId, spv::Id left, spv::Id right,
205
glslang::TBasicType typeProxy, bool reduceComparison = true);
206
spv::Id createBinaryMatrixOperation(spv::Op, OpDecorations&, spv::Id typeId, spv::Id left, spv::Id right);
207
spv::Id createUnaryOperation(glslang::TOperator op, OpDecorations&, spv::Id typeId, spv::Id operand,
208
glslang::TBasicType typeProxy,
209
const spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags,
210
const glslang::TType &opType);
211
spv::Id createUnaryMatrixOperation(spv::Op op, OpDecorations&, spv::Id typeId, spv::Id operand,
212
glslang::TBasicType typeProxy);
213
spv::Id createConversion(glslang::TOperator op, OpDecorations&, spv::Id destTypeId, spv::Id operand,
214
glslang::TBasicType resultBasicType, glslang::TBasicType operandBasicType);
215
spv::Id createIntWidthConversion(spv::Id operand, int vectorSize, spv::Id destType,
216
glslang::TBasicType resultBasicType, glslang::TBasicType operandBasicType);
217
spv::Id makeSmearedConstant(spv::Id constant, int vectorSize);
218
spv::Id createAtomicOperation(glslang::TOperator op, spv::Decoration precision, spv::Id typeId,
219
std::vector<spv::Id>& operands, glslang::TBasicType typeProxy,
220
const spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags,
221
const glslang::TType &opType);
222
spv::Id createInvocationsOperation(glslang::TOperator op, spv::Id typeId, std::vector<spv::Id>& operands,
223
glslang::TBasicType typeProxy);
224
spv::Id CreateInvocationsVectorOperation(spv::Op op, spv::GroupOperation groupOperation,
225
spv::Id typeId, std::vector<spv::Id>& operands);
226
spv::Id createSubgroupOperation(glslang::TOperator op, spv::Id typeId, std::vector<spv::Id>& operands,
227
glslang::TBasicType typeProxy);
228
spv::Id createMiscOperation(glslang::TOperator op, spv::Decoration precision, spv::Id typeId,
229
std::vector<spv::Id>& operands, glslang::TBasicType typeProxy);
230
spv::Id createNoArgOperation(glslang::TOperator op, spv::Decoration precision, spv::Id typeId);
231
spv::Id getSymbolId(const glslang::TIntermSymbol* node);
232
void addMeshNVDecoration(spv::Id id, int member, const glslang::TQualifier & qualifier);
233
bool hasQCOMImageProceessingDecoration(spv::Id id, spv::Decoration decor);
234
void addImageProcessingQCOMDecoration(spv::Id id, spv::Decoration decor);
235
void addImageProcessing2QCOMDecoration(spv::Id id, bool isForGather);
236
spv::Id createSpvConstant(const glslang::TIntermTyped&);
237
spv::Id createSpvConstantFromConstUnionArray(const glslang::TType& type, const glslang::TConstUnionArray&,
238
int& nextConst, bool specConstant);
239
bool isTrivialLeaf(const glslang::TIntermTyped* node);
240
bool isTrivial(const glslang::TIntermTyped* node);
241
spv::Id createShortCircuit(glslang::TOperator, glslang::TIntermTyped& left, glslang::TIntermTyped& right);
242
spv::Id getExtBuiltins(const char* name);
243
std::pair<spv::Id, spv::Id> getForcedType(glslang::TBuiltInVariable builtIn, const glslang::TType&);
244
spv::Id translateForcedType(spv::Id object);
245
spv::Id createCompositeConstruct(spv::Id typeId, std::vector<spv::Id> constituents);
246
247
glslang::SpvOptions& options;
248
spv::Function* shaderEntry;
249
spv::Function* currentFunction;
250
spv::Instruction* entryPoint;
251
int sequenceDepth;
252
253
spv::SpvBuildLogger* logger;
254
255
// There is a 1:1 mapping between a spv builder and a module; this is thread safe
256
spv::Builder builder;
257
bool inEntryPoint;
258
bool entryPointTerminated;
259
bool linkageOnly; // true when visiting the set of objects in the AST present only for
260
// establishing interface, whether or not they were statically used
261
std::set<spv::Id> iOSet; // all input/output variables from either static use or declaration of interface
262
const glslang::TIntermediate* glslangIntermediate;
263
bool nanMinMaxClamp; // true if use NMin/NMax/NClamp instead of FMin/FMax/FClamp
264
spv::Id stdBuiltins;
265
spv::Id nonSemanticDebugPrintf;
266
std::unordered_map<std::string, spv::Id> extBuiltinMap;
267
268
std::unordered_map<long long, spv::Id> symbolValues;
269
std::unordered_map<uint32_t, spv::Id> builtInVariableIds;
270
std::unordered_set<long long> rValueParameters; // set of formal function parameters passed as rValues,
271
// rather than a pointer
272
std::unordered_map<std::string, spv::Function*> functionMap;
273
std::unordered_map<const glslang::TTypeList*, spv::Id> structMap[glslang::ElpCount][glslang::ElmCount];
274
// for mapping glslang block indices to spv indices (e.g., due to hidden members):
275
std::unordered_map<long long, std::vector<int>> memberRemapper;
276
// for mapping glslang symbol struct to symbol Id
277
std::unordered_map<const glslang::TTypeList*, long long> glslangTypeToIdMap;
278
std::stack<bool> breakForLoop; // false means break for switch
279
std::unordered_map<std::string, const glslang::TIntermSymbol*> counterOriginator;
280
// Map pointee types for EbtReference to their forward pointers
281
std::map<const glslang::TType *, spv::Id> forwardPointers;
282
// Type forcing, for when SPIR-V wants a different type than the AST,
283
// requiring local translation to and from SPIR-V type on every access.
284
// Maps <builtin-variable-id -> AST-required-type-id>
285
std::unordered_map<spv::Id, spv::Id> forceType;
286
// Used by Task shader while generating opearnds for OpEmitMeshTasksEXT
287
spv::Id taskPayloadID;
288
// Used later for generating OpTraceKHR/OpExecuteCallableKHR/OpHitObjectRecordHit*/OpHitObjectGetShaderBindingTableData
289
std::unordered_map<unsigned int, glslang::TIntermSymbol *> locationToSymbol[4];
290
std::unordered_map<spv::Id, std::vector<spv::Decoration> > idToQCOMDecorations;
291
};
292
293
//
294
// Helper functions for translating glslang representations to SPIR-V enumerants.
295
//
296
297
// Translate glslang profile to SPIR-V source language.
298
spv::SourceLanguage TranslateSourceLanguage(glslang::EShSource source, EProfile profile)
299
{
300
switch (source) {
301
case glslang::EShSourceGlsl:
302
switch (profile) {
303
case ENoProfile:
304
case ECoreProfile:
305
case ECompatibilityProfile:
306
return spv::SourceLanguage::GLSL;
307
case EEsProfile:
308
return spv::SourceLanguage::ESSL;
309
default:
310
return spv::SourceLanguage::Unknown;
311
}
312
case glslang::EShSourceHlsl:
313
return spv::SourceLanguage::HLSL;
314
default:
315
return spv::SourceLanguage::Unknown;
316
}
317
}
318
319
// Translate glslang language (stage) to SPIR-V execution model.
320
spv::ExecutionModel TranslateExecutionModel(EShLanguage stage, bool isMeshShaderEXT = false)
321
{
322
switch (stage) {
323
case EShLangVertex: return spv::ExecutionModel::Vertex;
324
case EShLangFragment: return spv::ExecutionModel::Fragment;
325
case EShLangCompute: return spv::ExecutionModel::GLCompute;
326
case EShLangTessControl: return spv::ExecutionModel::TessellationControl;
327
case EShLangTessEvaluation: return spv::ExecutionModel::TessellationEvaluation;
328
case EShLangGeometry: return spv::ExecutionModel::Geometry;
329
case EShLangRayGen: return spv::ExecutionModel::RayGenerationKHR;
330
case EShLangIntersect: return spv::ExecutionModel::IntersectionKHR;
331
case EShLangAnyHit: return spv::ExecutionModel::AnyHitKHR;
332
case EShLangClosestHit: return spv::ExecutionModel::ClosestHitKHR;
333
case EShLangMiss: return spv::ExecutionModel::MissKHR;
334
case EShLangCallable: return spv::ExecutionModel::CallableKHR;
335
case EShLangTask: return (isMeshShaderEXT)? spv::ExecutionModel::TaskEXT : spv::ExecutionModel::TaskNV;
336
case EShLangMesh: return (isMeshShaderEXT)? spv::ExecutionModel::MeshEXT : spv::ExecutionModel::MeshNV;
337
default:
338
assert(0);
339
return spv::ExecutionModel::Fragment;
340
}
341
}
342
343
// Translate glslang sampler type to SPIR-V dimensionality.
344
spv::Dim TranslateDimensionality(const glslang::TSampler& sampler)
345
{
346
switch (sampler.dim) {
347
case glslang::Esd1D: return spv::Dim::Dim1D;
348
case glslang::Esd2D: return spv::Dim::Dim2D;
349
case glslang::Esd3D: return spv::Dim::Dim3D;
350
case glslang::EsdCube: return spv::Dim::Cube;
351
case glslang::EsdRect: return spv::Dim::Rect;
352
case glslang::EsdBuffer: return spv::Dim::Buffer;
353
case glslang::EsdSubpass: return spv::Dim::SubpassData;
354
case glslang::EsdAttachmentEXT: return spv::Dim::TileImageDataEXT;
355
default:
356
assert(0);
357
return spv::Dim::Dim2D;
358
}
359
}
360
361
// Translate glslang precision to SPIR-V precision decorations.
362
spv::Decoration TranslatePrecisionDecoration(glslang::TPrecisionQualifier glslangPrecision)
363
{
364
switch (glslangPrecision) {
365
case glslang::EpqLow: return spv::Decoration::RelaxedPrecision;
366
case glslang::EpqMedium: return spv::Decoration::RelaxedPrecision;
367
default:
368
return spv::NoPrecision;
369
}
370
}
371
372
// Translate glslang type to SPIR-V precision decorations.
373
spv::Decoration TranslatePrecisionDecoration(const glslang::TType& type)
374
{
375
return TranslatePrecisionDecoration(type.getQualifier().precision);
376
}
377
378
// Translate glslang type to SPIR-V block decorations.
379
spv::Decoration TranslateBlockDecoration(const glslang::TStorageQualifier storage, bool useStorageBuffer)
380
{
381
switch (storage) {
382
case glslang::EvqUniform: return spv::Decoration::Block;
383
case glslang::EvqBuffer: return useStorageBuffer ? spv::Decoration::Block : spv::Decoration::BufferBlock;
384
case glslang::EvqVaryingIn: return spv::Decoration::Block;
385
case glslang::EvqVaryingOut: return spv::Decoration::Block;
386
case glslang::EvqShared: return spv::Decoration::Block;
387
case glslang::EvqPayload: return spv::Decoration::Block;
388
case glslang::EvqPayloadIn: return spv::Decoration::Block;
389
case glslang::EvqHitAttr: return spv::Decoration::Block;
390
case glslang::EvqCallableData: return spv::Decoration::Block;
391
case glslang::EvqCallableDataIn: return spv::Decoration::Block;
392
case glslang::EvqHitObjectAttrNV: return spv::Decoration::Block;
393
case glslang::EvqHitObjectAttrEXT: return spv::Decoration::Block;
394
default:
395
assert(0);
396
break;
397
}
398
399
return spv::Decoration::Max;
400
}
401
402
// Translate glslang type to SPIR-V memory decorations.
403
void TranslateMemoryDecoration(const glslang::TQualifier& qualifier, std::vector<spv::Decoration>& memory,
404
bool useVulkanMemoryModel)
405
{
406
if (!useVulkanMemoryModel) {
407
if (qualifier.isVolatile()) {
408
memory.push_back(spv::Decoration::Volatile);
409
memory.push_back(spv::Decoration::Coherent);
410
} else if (qualifier.isCoherent()) {
411
memory.push_back(spv::Decoration::Coherent);
412
}
413
}
414
if (qualifier.isRestrict())
415
memory.push_back(spv::Decoration::Restrict);
416
if (qualifier.isReadOnly())
417
memory.push_back(spv::Decoration::NonWritable);
418
if (qualifier.isWriteOnly())
419
memory.push_back(spv::Decoration::NonReadable);
420
}
421
422
// Translate glslang type to SPIR-V layout decorations.
423
spv::Decoration TranslateLayoutDecoration(const glslang::TType& type, glslang::TLayoutMatrix matrixLayout)
424
{
425
if (type.isMatrix()) {
426
switch (matrixLayout) {
427
case glslang::ElmRowMajor:
428
return spv::Decoration::RowMajor;
429
case glslang::ElmColumnMajor:
430
return spv::Decoration::ColMajor;
431
default:
432
// opaque layouts don't need a majorness
433
return spv::Decoration::Max;
434
}
435
} else {
436
switch (type.getBasicType()) {
437
default:
438
return spv::Decoration::Max;
439
break;
440
case glslang::EbtBlock:
441
switch (type.getQualifier().storage) {
442
case glslang::EvqShared:
443
case glslang::EvqUniform:
444
case glslang::EvqBuffer:
445
switch (type.getQualifier().layoutPacking) {
446
case glslang::ElpShared: return spv::Decoration::GLSLShared;
447
case glslang::ElpPacked: return spv::Decoration::GLSLPacked;
448
default:
449
return spv::Decoration::Max;
450
}
451
case glslang::EvqVaryingIn:
452
case glslang::EvqVaryingOut:
453
if (type.getQualifier().isTaskMemory()) {
454
switch (type.getQualifier().layoutPacking) {
455
case glslang::ElpShared: return spv::Decoration::GLSLShared;
456
case glslang::ElpPacked: return spv::Decoration::GLSLPacked;
457
default: break;
458
}
459
} else {
460
assert(type.getQualifier().layoutPacking == glslang::ElpNone);
461
}
462
return spv::Decoration::Max;
463
case glslang::EvqPayload:
464
case glslang::EvqPayloadIn:
465
case glslang::EvqHitAttr:
466
case glslang::EvqCallableData:
467
case glslang::EvqCallableDataIn:
468
case glslang::EvqHitObjectAttrNV:
469
case glslang::EvqHitObjectAttrEXT:
470
return spv::Decoration::Max;
471
default:
472
assert(0);
473
return spv::Decoration::Max;
474
}
475
}
476
}
477
}
478
479
// Translate glslang type to SPIR-V interpolation decorations.
480
// Returns spv::Decoration::Max when no decoration
481
// should be applied.
482
spv::Decoration TGlslangToSpvTraverser::TranslateInterpolationDecoration(const glslang::TQualifier& qualifier)
483
{
484
if (qualifier.smooth)
485
// Smooth decoration doesn't exist in SPIR-V 1.0
486
return spv::Decoration::Max;
487
else if (qualifier.isNonPerspective())
488
return spv::Decoration::NoPerspective;
489
else if (qualifier.flat)
490
return spv::Decoration::Flat;
491
else if (qualifier.isExplicitInterpolation()) {
492
builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
493
return spv::Decoration::ExplicitInterpAMD;
494
}
495
else
496
return spv::Decoration::Max;
497
}
498
499
// Translate glslang type to SPIR-V auxiliary storage decorations.
500
// Returns spv::Decoration::Max when no decoration
501
// should be applied.
502
spv::Decoration TGlslangToSpvTraverser::TranslateAuxiliaryStorageDecoration(const glslang::TQualifier& qualifier)
503
{
504
if (qualifier.centroid)
505
return spv::Decoration::Centroid;
506
else if (qualifier.patch)
507
return spv::Decoration::Patch;
508
else if (qualifier.sample) {
509
builder.addCapability(spv::Capability::SampleRateShading);
510
return spv::Decoration::Sample;
511
}
512
513
return spv::Decoration::Max;
514
}
515
516
// If glslang type is invariant, return SPIR-V invariant decoration.
517
spv::Decoration TranslateInvariantDecoration(const glslang::TQualifier& qualifier)
518
{
519
if (qualifier.invariant)
520
return spv::Decoration::Invariant;
521
else
522
return spv::Decoration::Max;
523
}
524
525
// If glslang type is noContraction, return SPIR-V NoContraction decoration.
526
spv::Decoration TranslateNoContractionDecoration(const glslang::TQualifier& qualifier)
527
{
528
if (qualifier.isNoContraction())
529
return spv::Decoration::NoContraction;
530
else
531
return spv::Decoration::Max;
532
}
533
534
// If glslang type is nonUniform, return SPIR-V NonUniform decoration.
535
spv::Decoration TGlslangToSpvTraverser::TranslateNonUniformDecoration(const glslang::TQualifier& qualifier)
536
{
537
if (qualifier.isNonUniform()) {
538
builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);
539
builder.addCapability(spv::Capability::ShaderNonUniformEXT);
540
return spv::Decoration::NonUniformEXT;
541
} else
542
return spv::Decoration::Max;
543
}
544
545
// If lvalue flags contains nonUniform, return SPIR-V NonUniform decoration.
546
spv::Decoration TGlslangToSpvTraverser::TranslateNonUniformDecoration(
547
const spv::Builder::AccessChain::CoherentFlags& coherentFlags)
548
{
549
if (coherentFlags.isNonUniform()) {
550
builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);
551
builder.addCapability(spv::Capability::ShaderNonUniformEXT);
552
return spv::Decoration::NonUniformEXT;
553
} else
554
return spv::Decoration::Max;
555
}
556
557
// Build the SPIR-V memory-access mask implied by a set of coherent flags.
// Yields MaskNone when the Vulkan memory model is not in use or when the
// flags describe an image. Whenever a non-empty mask is produced, the
// VulkanMemoryModelKHR capability is declared.
spv::MemoryAccessMask TGlslangToSpvTraverser::TranslateMemoryAccess(
    const spv::Builder::AccessChain::CoherentFlags &coherentFlags)
{
    const bool applies = glslangIntermediate->usingVulkanMemoryModel() && !coherentFlags.isImage;
    if (!applies)
        return spv::MemoryAccessMask::MaskNone;

    spv::MemoryAccessMask mask = spv::MemoryAccessMask::MaskNone;
    const auto add = [&mask](spv::MemoryAccessMask bit) { mask = mask | bit; };

    // Volatile or any-scope coherent accesses make the pointer both
    // available and visible.
    if (coherentFlags.isVolatile() || coherentFlags.anyCoherent()) {
        add(spv::MemoryAccessMask::MakePointerAvailableKHR);
        add(spv::MemoryAccessMask::MakePointerVisibleKHR);
    }

    if (coherentFlags.nonprivate)
        add(spv::MemoryAccessMask::NonPrivatePointerKHR);
    if (coherentFlags.volatil)
        add(spv::MemoryAccessMask::Volatile);
    if (coherentFlags.nontemporal)
        add(spv::MemoryAccessMask::Nontemporal);

    if (mask != spv::MemoryAccessMask::MaskNone)
        builder.addCapability(spv::Capability::VulkanMemoryModelKHR);

    return mask;
}
585
586
// Build the SPIR-V image-operands mask implied by a set of coherent flags.
// Yields MaskNone when the Vulkan memory model is not in use. The
// Nontemporal bit is only added when the builder targets SPIR-V 1.6 or
// later. Whenever a non-empty mask is produced, the VulkanMemoryModelKHR
// capability is declared.
spv::ImageOperandsMask TGlslangToSpvTraverser::TranslateImageOperands(
    const spv::Builder::AccessChain::CoherentFlags &coherentFlags)
{
    if (!glslangIntermediate->usingVulkanMemoryModel())
        return spv::ImageOperandsMask::MaskNone;

    spv::ImageOperandsMask mask = spv::ImageOperandsMask::MaskNone;
    const auto add = [&mask](spv::ImageOperandsMask bit) { mask = mask | bit; };

    // Volatile or any-scope coherent accesses make the texel both
    // available and visible.
    if (coherentFlags.volatil || coherentFlags.anyCoherent()) {
        add(spv::ImageOperandsMask::MakeTexelAvailableKHR);
        add(spv::ImageOperandsMask::MakeTexelVisibleKHR);
    }

    if (coherentFlags.nonprivate)
        add(spv::ImageOperandsMask::NonPrivateTexelKHR);
    if (coherentFlags.volatil)
        add(spv::ImageOperandsMask::VolatileTexelKHR);
    if (coherentFlags.nontemporal && builder.getSpvVersion() >= spv::Spv_1_6)
        add(spv::ImageOperandsMask::Nontemporal);

    if (mask != spv::ImageOperandsMask::MaskNone)
        builder.addCapability(spv::Capability::VulkanMemoryModelKHR);

    return mask;
}
614
615
// Collect the coherence-related qualifiers of a glslang type into the
// builder's CoherentFlags structure. Besides copying the individual
// qualifier bits, this applies two implicit rules (see inline comments) and
// records whether the type is a sampler (isImage).
spv::Builder::AccessChain::CoherentFlags TGlslangToSpvTraverser::TranslateCoherent(const glslang::TType& type)
{
    const glslang::TQualifier& qualifier = type.getQualifier();

    spv::Builder::AccessChain::CoherentFlags flags = {};

    flags.coherent = qualifier.coherent;
    flags.devicecoherent = qualifier.devicecoherent;
    flags.queuefamilycoherent = qualifier.queuefamilycoherent;

    // shared variables are implicitly workgroupcoherent in GLSL.
    flags.workgroupcoherent = qualifier.workgroupcoherent || qualifier.storage == glslang::EvqShared;

    flags.subgroupcoherent = qualifier.subgroupcoherent;
    flags.shadercallcoherent = qualifier.shadercallcoherent;
    flags.volatil = qualifier.volatil;
    flags.nontemporal = qualifier.nontemporal;

    // *coherent variables are implicitly nonprivate in GLSL.
    // This must come after the coherent/volatile bits above are filled in,
    // because it reads them back from 'flags'.
    flags.nonprivate = qualifier.nonprivate || flags.anyCoherent() || flags.volatil;

    flags.isImage = type.getBasicType() == glslang::EbtSampler;
    flags.nonUniform = qualifier.nonUniform;

    return flags;
}
636
637
// Choose the SPIR-V memory scope implied by a set of coherent flags.
// The flags are examined in priority order (volatile/coherent, device,
// queue family, workgroup, subgroup, shader call); spv::Scope::Max is
// returned when none is set. Selecting Device scope under the Vulkan memory
// model also declares the VulkanMemoryModelDeviceScopeKHR capability.
spv::Scope TGlslangToSpvTraverser::TranslateMemoryScope(
    const spv::Builder::AccessChain::CoherentFlags &coherentFlags)
{
    const bool vulkanMemoryModel = glslangIntermediate->usingVulkanMemoryModel();

    const auto pickScope = [&]() -> spv::Scope {
        // coherent defaults to Device scope in the old model, QueueFamilyKHR scope in the new model
        if (coherentFlags.volatil || coherentFlags.coherent)
            return vulkanMemoryModel ? spv::Scope::QueueFamilyKHR : spv::Scope::Device;
        if (coherentFlags.devicecoherent)
            return spv::Scope::Device;
        if (coherentFlags.queuefamilycoherent)
            return spv::Scope::QueueFamilyKHR;
        if (coherentFlags.workgroupcoherent)
            return spv::Scope::Workgroup;
        if (coherentFlags.subgroupcoherent)
            return spv::Scope::Subgroup;
        if (coherentFlags.shadercallcoherent)
            return spv::Scope::ShaderCallKHR;
        return spv::Scope::Max;
    };

    const spv::Scope scope = pickScope();

    if (vulkanMemoryModel && scope == spv::Scope::Device)
        builder.addCapability(spv::Capability::VulkanMemoryModelDeviceScopeKHR);

    return scope;
}
662
663
// Translate a glslang built-in variable to a SPIR-V built in decoration. Also generate
664
// associated capabilities when required. For some built-in variables, a capability
665
// is generated only when using the variable in an executable instruction, but not when
666
// just declaring a struct member variable with it. This is true for PointSize,
667
// ClipDistance, and CullDistance.
668
spv::BuiltIn TGlslangToSpvTraverser::TranslateBuiltInDecoration(glslang::TBuiltInVariable builtIn,
                                                                bool memberDeclaration)
{
    // Several cases depend on the shader stage being compiled; read it once.
    const auto stage = glslangIntermediate->getStage();

    // Declare an extension followed by the capability it provides.
    const auto requireExtThenCap = [this](const char* extension, spv::Capability capability) {
        builder.addExtension(extension);
        builder.addCapability(capability);
    };

    // Same pair, but capability first (kept separate so the call order of the
    // cases that use it stays exactly as written).
    const auto requireCapThenExt = [this](spv::Capability capability, const char* extension) {
        builder.addCapability(capability);
        builder.addExtension(extension);
    };

    // Extension registered through addIncorporatedExtension() with SPIR-V 1.3,
    // followed by its capability.
    const auto requireIncorporatedIn13 = [this](const char* extension, spv::Capability capability) {
        builder.addIncorporatedExtension(extension, spv::Spv_1_3);
        builder.addCapability(capability);
    };

    // ViewportIndex / Layer written from vertex or tessellation stages:
    // below SPIR-V 1.5 use the EXT extension + capability, otherwise the
    // capability supplied by the caller.
    const auto requireViewportIndexLayer = [this](spv::Capability coreCapability) {
        if (builder.getSpvVersion() < spv::Spv_1_5) {
            builder.addIncorporatedExtension(spv::E_SPV_EXT_shader_viewport_index_layer, spv::Spv_1_5);
            builder.addCapability(spv::Capability::ShaderViewportIndexLayerEXT);
        } else {
            builder.addCapability(coreCapability);
        }
    };

    const bool isVertexOrTessStage = stage == EShLangVertex ||
                                     stage == EShLangTessControl ||
                                     stage == EShLangTessEvaluation;
    const bool isGeometryOrFragmentStage = stage == EShLangGeometry ||
                                           stage == EShLangFragment;

    switch (builtIn) {
    case glslang::EbvPointSize:
        // The capability is only added on use, not for a bare member declaration.
        if (!memberDeclaration) {
            if (stage == EShLangGeometry)
                builder.addCapability(spv::Capability::GeometryPointSize);
            else if (stage == EShLangTessControl || stage == EShLangTessEvaluation)
                builder.addCapability(spv::Capability::TessellationPointSize);
        }
        return spv::BuiltIn::PointSize;

    case glslang::EbvPosition:      return spv::BuiltIn::Position;
    case glslang::EbvVertexId:      return spv::BuiltIn::VertexId;
    case glslang::EbvInstanceId:    return spv::BuiltIn::InstanceId;
    case glslang::EbvVertexIndex:   return spv::BuiltIn::VertexIndex;
    case glslang::EbvInstanceIndex: return spv::BuiltIn::InstanceIndex;

    case glslang::EbvFragCoord:  return spv::BuiltIn::FragCoord;
    case glslang::EbvPointCoord: return spv::BuiltIn::PointCoord;
    case glslang::EbvFace:       return spv::BuiltIn::FrontFacing;
    case glslang::EbvFragDepth:  return spv::BuiltIn::FragDepth;

    case glslang::EbvNumWorkGroups:        return spv::BuiltIn::NumWorkgroups;
    case glslang::EbvWorkGroupSize:        return spv::BuiltIn::WorkgroupSize;
    case glslang::EbvWorkGroupId:          return spv::BuiltIn::WorkgroupId;
    case glslang::EbvLocalInvocationId:    return spv::BuiltIn::LocalInvocationId;
    case glslang::EbvLocalInvocationIndex: return spv::BuiltIn::LocalInvocationIndex;
    case glslang::EbvGlobalInvocationId:   return spv::BuiltIn::GlobalInvocationId;

    // The *Distance capabilities are added on use rather than on member
    // declaration: a member that is declared but never used should not
    // cause the capability to be declared.
    case glslang::EbvClipDistance:
        if (!memberDeclaration)
            builder.addCapability(spv::Capability::ClipDistance);
        return spv::BuiltIn::ClipDistance;

    case glslang::EbvCullDistance:
        if (!memberDeclaration)
            builder.addCapability(spv::Capability::CullDistance);
        return spv::BuiltIn::CullDistance;

    case glslang::EbvViewportIndex:
        if (isGeometryOrFragmentStage)
            builder.addCapability(spv::Capability::MultiViewport);
        if (isVertexOrTessStage)
            requireViewportIndexLayer(spv::Capability::ShaderViewportIndex);
        return spv::BuiltIn::ViewportIndex;

    case glslang::EbvSampleId:
        builder.addCapability(spv::Capability::SampleRateShading);
        return spv::BuiltIn::SampleId;

    case glslang::EbvSamplePosition:
        builder.addCapability(spv::Capability::SampleRateShading);
        return spv::BuiltIn::SamplePosition;

    case glslang::EbvSampleMask:
        return spv::BuiltIn::SampleMask;

    case glslang::EbvLayer:
        // Mesh stage: no capability is added here.
        if (stage == EShLangMesh)
            return spv::BuiltIn::Layer;
        if (isGeometryOrFragmentStage)
            builder.addCapability(spv::Capability::Geometry);
        if (isVertexOrTessStage)
            requireViewportIndexLayer(spv::Capability::ShaderLayer);
        return spv::BuiltIn::Layer;

    case glslang::EbvBaseVertex:
        requireIncorporatedIn13(spv::E_SPV_KHR_shader_draw_parameters, spv::Capability::DrawParameters);
        return spv::BuiltIn::BaseVertex;

    case glslang::EbvBaseInstance:
        requireIncorporatedIn13(spv::E_SPV_KHR_shader_draw_parameters, spv::Capability::DrawParameters);
        return spv::BuiltIn::BaseInstance;

    case glslang::EbvDrawId:
        requireIncorporatedIn13(spv::E_SPV_KHR_shader_draw_parameters, spv::Capability::DrawParameters);
        return spv::BuiltIn::DrawIndex;

    case glslang::EbvPrimitiveId:
        if (stage == EShLangFragment)
            builder.addCapability(spv::Capability::Geometry);
        return spv::BuiltIn::PrimitiveId;

    case glslang::EbvFragStencilRef:
        requireExtThenCap(spv::E_SPV_EXT_shader_stencil_export, spv::Capability::StencilExportEXT);
        return spv::BuiltIn::FragStencilRefEXT;

    case glslang::EbvShadingRateKHR:
        requireExtThenCap(spv::E_SPV_KHR_fragment_shading_rate, spv::Capability::FragmentShadingRateKHR);
        return spv::BuiltIn::ShadingRateKHR;

    case glslang::EbvPrimitiveShadingRateKHR:
        requireExtThenCap(spv::E_SPV_KHR_fragment_shading_rate, spv::Capability::FragmentShadingRateKHR);
        return spv::BuiltIn::PrimitiveShadingRateKHR;

    case glslang::EbvInvocationId:     return spv::BuiltIn::InvocationId;
    case glslang::EbvTessLevelInner:   return spv::BuiltIn::TessLevelInner;
    case glslang::EbvTessLevelOuter:   return spv::BuiltIn::TessLevelOuter;
    case glslang::EbvTessCoord:        return spv::BuiltIn::TessCoord;
    case glslang::EbvPatchVertices:    return spv::BuiltIn::PatchVertices;
    case glslang::EbvHelperInvocation: return spv::BuiltIn::HelperInvocation;

    // Subgroup built-ins that go through SPV_KHR_shader_ballot
    case glslang::EbvSubGroupSize:
        requireExtThenCap(spv::E_SPV_KHR_shader_ballot, spv::Capability::SubgroupBallotKHR);
        return spv::BuiltIn::SubgroupSize;

    case glslang::EbvSubGroupInvocation:
        requireExtThenCap(spv::E_SPV_KHR_shader_ballot, spv::Capability::SubgroupBallotKHR);
        return spv::BuiltIn::SubgroupLocalInvocationId;

    case glslang::EbvSubGroupEqMask:
        requireExtThenCap(spv::E_SPV_KHR_shader_ballot, spv::Capability::SubgroupBallotKHR);
        return spv::BuiltIn::SubgroupEqMask;

    case glslang::EbvSubGroupGeMask:
        requireExtThenCap(spv::E_SPV_KHR_shader_ballot, spv::Capability::SubgroupBallotKHR);
        return spv::BuiltIn::SubgroupGeMask;

    case glslang::EbvSubGroupGtMask:
        requireExtThenCap(spv::E_SPV_KHR_shader_ballot, spv::Capability::SubgroupBallotKHR);
        return spv::BuiltIn::SubgroupGtMask;

    case glslang::EbvSubGroupLeMask:
        requireExtThenCap(spv::E_SPV_KHR_shader_ballot, spv::Capability::SubgroupBallotKHR);
        return spv::BuiltIn::SubgroupLeMask;

    case glslang::EbvSubGroupLtMask:
        requireExtThenCap(spv::E_SPV_KHR_shader_ballot, spv::Capability::SubgroupBallotKHR);
        return spv::BuiltIn::SubgroupLtMask;

    // Subgroup built-ins that go through the GroupNonUniform capabilities
    case glslang::EbvNumSubgroups:
        builder.addCapability(spv::Capability::GroupNonUniform);
        return spv::BuiltIn::NumSubgroups;

    case glslang::EbvSubgroupID:
        builder.addCapability(spv::Capability::GroupNonUniform);
        return spv::BuiltIn::SubgroupId;

    case glslang::EbvSubgroupSize2:
        builder.addCapability(spv::Capability::GroupNonUniform);
        return spv::BuiltIn::SubgroupSize;

    case glslang::EbvSubgroupInvocation2:
        builder.addCapability(spv::Capability::GroupNonUniform);
        return spv::BuiltIn::SubgroupLocalInvocationId;

    case glslang::EbvSubgroupEqMask2:
        builder.addCapability(spv::Capability::GroupNonUniform);
        builder.addCapability(spv::Capability::GroupNonUniformBallot);
        return spv::BuiltIn::SubgroupEqMask;

    case glslang::EbvSubgroupGeMask2:
        builder.addCapability(spv::Capability::GroupNonUniform);
        builder.addCapability(spv::Capability::GroupNonUniformBallot);
        return spv::BuiltIn::SubgroupGeMask;

    case glslang::EbvSubgroupGtMask2:
        builder.addCapability(spv::Capability::GroupNonUniform);
        builder.addCapability(spv::Capability::GroupNonUniformBallot);
        return spv::BuiltIn::SubgroupGtMask;

    case glslang::EbvSubgroupLeMask2:
        builder.addCapability(spv::Capability::GroupNonUniform);
        builder.addCapability(spv::Capability::GroupNonUniformBallot);
        return spv::BuiltIn::SubgroupLeMask;

    case glslang::EbvSubgroupLtMask2:
        builder.addCapability(spv::Capability::GroupNonUniform);
        builder.addCapability(spv::Capability::GroupNonUniformBallot);
        return spv::BuiltIn::SubgroupLtMask;

    // AMD explicit vertex parameter barycentrics: extension only, no capability
    case glslang::EbvBaryCoordNoPersp:
        builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
        return spv::BuiltIn::BaryCoordNoPerspAMD;

    case glslang::EbvBaryCoordNoPerspCentroid:
        builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
        return spv::BuiltIn::BaryCoordNoPerspCentroidAMD;

    case glslang::EbvBaryCoordNoPerspSample:
        builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
        return spv::BuiltIn::BaryCoordNoPerspSampleAMD;

    case glslang::EbvBaryCoordSmooth:
        builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
        return spv::BuiltIn::BaryCoordSmoothAMD;

    case glslang::EbvBaryCoordSmoothCentroid:
        builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
        return spv::BuiltIn::BaryCoordSmoothCentroidAMD;

    case glslang::EbvBaryCoordSmoothSample:
        builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
        return spv::BuiltIn::BaryCoordSmoothSampleAMD;

    case glslang::EbvBaryCoordPullModel:
        builder.addExtension(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
        return spv::BuiltIn::BaryCoordPullModelAMD;

    case glslang::EbvDeviceIndex:
        requireIncorporatedIn13(spv::E_SPV_KHR_device_group, spv::Capability::DeviceGroup);
        return spv::BuiltIn::DeviceIndex;

    case glslang::EbvViewIndex:
        requireIncorporatedIn13(spv::E_SPV_KHR_multiview, spv::Capability::MultiView);
        return spv::BuiltIn::ViewIndex;

    case glslang::EbvFragSizeEXT:
        requireExtThenCap(spv::E_SPV_EXT_fragment_invocation_density, spv::Capability::FragmentDensityEXT);
        return spv::BuiltIn::FragSizeEXT;

    case glslang::EbvFragInvocationCountEXT:
        requireExtThenCap(spv::E_SPV_EXT_fragment_invocation_density, spv::Capability::FragmentDensityEXT);
        return spv::BuiltIn::FragInvocationCountEXT;

    // The next five only declare their extension/capability on use,
    // not for a bare member declaration.
    case glslang::EbvViewportMaskNV:
        if (!memberDeclaration)
            requireExtThenCap(spv::E_SPV_NV_viewport_array2, spv::Capability::ShaderViewportMaskNV);
        return spv::BuiltIn::ViewportMaskNV;
    case glslang::EbvSecondaryPositionNV:
        if (!memberDeclaration)
            requireExtThenCap(spv::E_SPV_NV_stereo_view_rendering, spv::Capability::ShaderStereoViewNV);
        return spv::BuiltIn::SecondaryPositionNV;
    case glslang::EbvSecondaryViewportMaskNV:
        if (!memberDeclaration)
            requireExtThenCap(spv::E_SPV_NV_stereo_view_rendering, spv::Capability::ShaderStereoViewNV);
        return spv::BuiltIn::SecondaryViewportMaskNV;
    case glslang::EbvPositionPerViewNV:
        if (!memberDeclaration)
            requireExtThenCap(spv::E_SPV_NVX_multiview_per_view_attributes, spv::Capability::PerViewAttributesNV);
        return spv::BuiltIn::PositionPerViewNV;
    case glslang::EbvViewportMaskPerViewNV:
        if (!memberDeclaration)
            requireExtThenCap(spv::E_SPV_NVX_multiview_per_view_attributes, spv::Capability::PerViewAttributesNV);
        return spv::BuiltIn::ViewportMaskPerViewNV;
    case glslang::EbvFragFullyCoveredNV:
        requireExtThenCap(spv::E_SPV_EXT_fragment_fully_covered, spv::Capability::FragmentFullyCoveredEXT);
        return spv::BuiltIn::FullyCoveredEXT;
    case glslang::EbvFragmentSizeNV:
        requireExtThenCap(spv::E_SPV_NV_shading_rate, spv::Capability::ShadingRateNV);
        return spv::BuiltIn::FragmentSizeNV;
    case glslang::EbvInvocationsPerPixelNV:
        requireExtThenCap(spv::E_SPV_NV_shading_rate, spv::Capability::ShadingRateNV);
        return spv::BuiltIn::InvocationsPerPixelNV;

    // ray tracing
    case glslang::EbvLaunchId:             return spv::BuiltIn::LaunchIdKHR;
    case glslang::EbvLaunchSize:           return spv::BuiltIn::LaunchSizeKHR;
    case glslang::EbvWorldRayOrigin:       return spv::BuiltIn::WorldRayOriginKHR;
    case glslang::EbvWorldRayDirection:    return spv::BuiltIn::WorldRayDirectionKHR;
    case glslang::EbvObjectRayOrigin:      return spv::BuiltIn::ObjectRayOriginKHR;
    case glslang::EbvObjectRayDirection:   return spv::BuiltIn::ObjectRayDirectionKHR;
    case glslang::EbvRayTmin:              return spv::BuiltIn::RayTminKHR;
    case glslang::EbvRayTmax:              return spv::BuiltIn::RayTmaxKHR;
    case glslang::EbvCullMask:             return spv::BuiltIn::CullMaskKHR;
    case glslang::EbvPositionFetch:        return spv::BuiltIn::HitTriangleVertexPositionsKHR;
    case glslang::EbvInstanceCustomIndex:  return spv::BuiltIn::InstanceCustomIndexKHR;
    case glslang::EbvHitKind:              return spv::BuiltIn::HitKindKHR;
    case glslang::EbvObjectToWorld:
    case glslang::EbvObjectToWorld3x4:
        return spv::BuiltIn::ObjectToWorldKHR;
    case glslang::EbvWorldToObject:
    case glslang::EbvWorldToObject3x4:
        return spv::BuiltIn::WorldToObjectKHR;
    case glslang::EbvIncomingRayFlags:     return spv::BuiltIn::IncomingRayFlagsKHR;
    case glslang::EbvGeometryIndex:        return spv::BuiltIn::RayGeometryIndexKHR;
    case glslang::EbvCurrentRayTimeNV:
        requireExtThenCap(spv::E_SPV_NV_ray_tracing_motion_blur, spv::Capability::RayTracingMotionBlurNV);
        return spv::BuiltIn::CurrentRayTimeNV;
    case glslang::EbvMicroTrianglePositionNV:
        requireCapThenExt(spv::Capability::RayTracingDisplacementMicromapNV, "SPV_NV_displacement_micromap");
        return spv::BuiltIn::HitMicroTriangleVertexPositionsNV;
    case glslang::EbvMicroTriangleBaryNV:
        requireCapThenExt(spv::Capability::RayTracingDisplacementMicromapNV, "SPV_NV_displacement_micromap");
        return spv::BuiltIn::HitMicroTriangleVertexBarycentricsNV;
    case glslang::EbvHitKindFrontFacingMicroTriangleNV:
        requireCapThenExt(spv::Capability::RayTracingDisplacementMicromapNV, "SPV_NV_displacement_micromap");
        return spv::BuiltIn::HitKindFrontFacingMicroTriangleNV;
    case glslang::EbvHitKindBackFacingMicroTriangleNV:
        requireCapThenExt(spv::Capability::RayTracingDisplacementMicromapNV, "SPV_NV_displacement_micromap");
        return spv::BuiltIn::HitKindBackFacingMicroTriangleNV;
    case glslang::EbvClusterIDNV:
        requireCapThenExt(spv::Capability::RayTracingClusterAccelerationStructureNV,
                          "SPV_NV_cluster_acceleration_structure");
        return spv::BuiltIn::ClusterIDNV;
    case glslang::EbvHitIsSphereNV:
        requireCapThenExt(spv::Capability::RayTracingSpheresGeometryNV, "SPV_NV_linear_swept_spheres");
        return spv::BuiltIn::HitIsSphereNV;
    case glslang::EbvHitIsLSSNV:
        requireCapThenExt(spv::Capability::RayTracingLinearSweptSpheresGeometryNV, "SPV_NV_linear_swept_spheres");
        return spv::BuiltIn::HitIsLSSNV;
    case glslang::EbvHitSpherePositionNV:
        requireCapThenExt(spv::Capability::RayTracingSpheresGeometryNV, "SPV_NV_linear_swept_spheres");
        return spv::BuiltIn::HitSpherePositionNV;
    case glslang::EbvHitSphereRadiusNV:
        requireCapThenExt(spv::Capability::RayTracingSpheresGeometryNV, "SPV_NV_linear_swept_spheres");
        return spv::BuiltIn::HitSphereRadiusNV;
    case glslang::EbvHitLSSPositionsNV:
        requireCapThenExt(spv::Capability::RayTracingLinearSweptSpheresGeometryNV, "SPV_NV_linear_swept_spheres");
        return spv::BuiltIn::HitLSSPositionsNV;
    case glslang::EbvHitLSSRadiiNV:
        requireCapThenExt(spv::Capability::RayTracingLinearSweptSpheresGeometryNV, "SPV_NV_linear_swept_spheres");
        return spv::BuiltIn::HitLSSRadiiNV;

    // barycentrics
    case glslang::EbvBaryCoordNV:
        requireExtThenCap(spv::E_SPV_NV_fragment_shader_barycentric, spv::Capability::FragmentBarycentricNV);
        return spv::BuiltIn::BaryCoordNV;
    case glslang::EbvBaryCoordNoPerspNV:
        requireExtThenCap(spv::E_SPV_NV_fragment_shader_barycentric, spv::Capability::FragmentBarycentricNV);
        return spv::BuiltIn::BaryCoordNoPerspNV;

    case glslang::EbvBaryCoordEXT:
        requireExtThenCap(spv::E_SPV_KHR_fragment_shader_barycentric, spv::Capability::FragmentBarycentricKHR);
        return spv::BuiltIn::BaryCoordKHR;
    case glslang::EbvBaryCoordNoPerspEXT:
        requireExtThenCap(spv::E_SPV_KHR_fragment_shader_barycentric, spv::Capability::FragmentBarycentricKHR);
        return spv::BuiltIn::BaryCoordNoPerspKHR;

    // mesh shaders
    case glslang::EbvTaskCountNV:           return spv::BuiltIn::TaskCountNV;
    case glslang::EbvPrimitiveCountNV:      return spv::BuiltIn::PrimitiveCountNV;
    case glslang::EbvPrimitiveIndicesNV:    return spv::BuiltIn::PrimitiveIndicesNV;
    case glslang::EbvClipDistancePerViewNV: return spv::BuiltIn::ClipDistancePerViewNV;
    case glslang::EbvCullDistancePerViewNV: return spv::BuiltIn::CullDistancePerViewNV;
    case glslang::EbvLayerPerViewNV:        return spv::BuiltIn::LayerPerViewNV;
    case glslang::EbvMeshViewCountNV:       return spv::BuiltIn::MeshViewCountNV;
    case glslang::EbvMeshViewIndicesNV:     return spv::BuiltIn::MeshViewIndicesNV;

    // SPV_EXT_mesh_shader
    case glslang::EbvPrimitivePointIndicesEXT:    return spv::BuiltIn::PrimitivePointIndicesEXT;
    case glslang::EbvPrimitiveLineIndicesEXT:     return spv::BuiltIn::PrimitiveLineIndicesEXT;
    case glslang::EbvPrimitiveTriangleIndicesEXT: return spv::BuiltIn::PrimitiveTriangleIndicesEXT;
    case glslang::EbvCullPrimitiveEXT:            return spv::BuiltIn::CullPrimitiveEXT;

    // sm builtins
    case glslang::EbvWarpsPerSM:
        requireExtThenCap(spv::E_SPV_NV_shader_sm_builtins, spv::Capability::ShaderSMBuiltinsNV);
        return spv::BuiltIn::WarpsPerSMNV;
    case glslang::EbvSMCount:
        requireExtThenCap(spv::E_SPV_NV_shader_sm_builtins, spv::Capability::ShaderSMBuiltinsNV);
        return spv::BuiltIn::SMCountNV;
    case glslang::EbvWarpID:
        requireExtThenCap(spv::E_SPV_NV_shader_sm_builtins, spv::Capability::ShaderSMBuiltinsNV);
        return spv::BuiltIn::WarpIDNV;
    case glslang::EbvSMID:
        requireExtThenCap(spv::E_SPV_NV_shader_sm_builtins, spv::Capability::ShaderSMBuiltinsNV);
        return spv::BuiltIn::SMIDNV;

    // ARM builtins
    case glslang::EbvCoreCountARM:
        requireExtThenCap(spv::E_SPV_ARM_core_builtins, spv::Capability::CoreBuiltinsARM);
        return spv::BuiltIn::CoreCountARM;
    case glslang::EbvCoreIDARM:
        requireExtThenCap(spv::E_SPV_ARM_core_builtins, spv::Capability::CoreBuiltinsARM);
        return spv::BuiltIn::CoreIDARM;
    case glslang::EbvCoreMaxIDARM:
        requireExtThenCap(spv::E_SPV_ARM_core_builtins, spv::Capability::CoreBuiltinsARM);
        return spv::BuiltIn::CoreMaxIDARM;
    case glslang::EbvWarpIDARM:
        requireExtThenCap(spv::E_SPV_ARM_core_builtins, spv::Capability::CoreBuiltinsARM);
        return spv::BuiltIn::WarpIDARM;
    case glslang::EbvWarpMaxIDARM:
        requireExtThenCap(spv::E_SPV_ARM_core_builtins, spv::Capability::CoreBuiltinsARM);
        return spv::BuiltIn::WarpMaxIDARM;

    // QCOM builtins: extension only
    case glslang::EbvTileOffsetQCOM:
        builder.addExtension(spv::E_SPV_QCOM_tile_shading);
        return spv::BuiltIn::TileOffsetQCOM;
    case glslang::EbvTileDimensionQCOM:
        builder.addExtension(spv::E_SPV_QCOM_tile_shading);
        return spv::BuiltIn::TileDimensionQCOM;
    case glslang::EbvTileApronSizeQCOM:
        builder.addExtension(spv::E_SPV_QCOM_tile_shading);
        return spv::BuiltIn::TileApronSizeQCOM;

    default:
        // Anything not listed above has no translation here.
        return spv::BuiltIn::Max;
    }
}
1167
1168
// Translate glslang image layout format to SPIR-V image format.
1169
spv::ImageFormat TGlslangToSpvTraverser::TranslateImageFormat(const glslang::TType& type)
1170
{
1171
assert(type.getBasicType() == glslang::EbtSampler);
1172
1173
// Check for capabilities
1174
switch (type.getQualifier().getFormat()) {
1175
case glslang::ElfRg32f:
1176
case glslang::ElfRg16f:
1177
case glslang::ElfR11fG11fB10f:
1178
case glslang::ElfR16f:
1179
case glslang::ElfRgba16:
1180
case glslang::ElfRgb10A2:
1181
case glslang::ElfRg16:
1182
case glslang::ElfRg8:
1183
case glslang::ElfR16:
1184
case glslang::ElfR8:
1185
case glslang::ElfRgba16Snorm:
1186
case glslang::ElfRg16Snorm:
1187
case glslang::ElfRg8Snorm:
1188
case glslang::ElfR16Snorm:
1189
case glslang::ElfR8Snorm:
1190
1191
case glslang::ElfRg32i:
1192
case glslang::ElfRg16i:
1193
case glslang::ElfRg8i:
1194
case glslang::ElfR16i:
1195
case glslang::ElfR8i:
1196
1197
case glslang::ElfRgb10a2ui:
1198
case glslang::ElfRg32ui:
1199
case glslang::ElfRg16ui:
1200
case glslang::ElfRg8ui:
1201
case glslang::ElfR16ui:
1202
case glslang::ElfR8ui:
1203
builder.addCapability(spv::Capability::StorageImageExtendedFormats);
1204
break;
1205
1206
case glslang::ElfR64ui:
1207
case glslang::ElfR64i:
1208
builder.addExtension(spv::E_SPV_EXT_shader_image_int64);
1209
builder.addCapability(spv::Capability::Int64ImageEXT);
1210
break;
1211
default:
1212
break;
1213
}
1214
1215
// do the translation
1216
switch (type.getQualifier().getFormat()) {
1217
case glslang::ElfNone: return spv::ImageFormat::Unknown;
1218
case glslang::ElfRgba32f: return spv::ImageFormat::Rgba32f;
1219
case glslang::ElfRgba16f: return spv::ImageFormat::Rgba16f;
1220
case glslang::ElfR32f: return spv::ImageFormat::R32f;
1221
case glslang::ElfRgba8: return spv::ImageFormat::Rgba8;
1222
case glslang::ElfRgba8Snorm: return spv::ImageFormat::Rgba8Snorm;
1223
case glslang::ElfRg32f: return spv::ImageFormat::Rg32f;
1224
case glslang::ElfRg16f: return spv::ImageFormat::Rg16f;
1225
case glslang::ElfR11fG11fB10f: return spv::ImageFormat::R11fG11fB10f;
1226
case glslang::ElfR16f: return spv::ImageFormat::R16f;
1227
case glslang::ElfRgba16: return spv::ImageFormat::Rgba16;
1228
case glslang::ElfRgb10A2: return spv::ImageFormat::Rgb10A2;
1229
case glslang::ElfRg16: return spv::ImageFormat::Rg16;
1230
case glslang::ElfRg8: return spv::ImageFormat::Rg8;
1231
case glslang::ElfR16: return spv::ImageFormat::R16;
1232
case glslang::ElfR8: return spv::ImageFormat::R8;
1233
case glslang::ElfRgba16Snorm: return spv::ImageFormat::Rgba16Snorm;
1234
case glslang::ElfRg16Snorm: return spv::ImageFormat::Rg16Snorm;
1235
case glslang::ElfRg8Snorm: return spv::ImageFormat::Rg8Snorm;
1236
case glslang::ElfR16Snorm: return spv::ImageFormat::R16Snorm;
1237
case glslang::ElfR8Snorm: return spv::ImageFormat::R8Snorm;
1238
case glslang::ElfRgba32i: return spv::ImageFormat::Rgba32i;
1239
case glslang::ElfRgba16i: return spv::ImageFormat::Rgba16i;
1240
case glslang::ElfRgba8i: return spv::ImageFormat::Rgba8i;
1241
case glslang::ElfR32i: return spv::ImageFormat::R32i;
1242
case glslang::ElfRg32i: return spv::ImageFormat::Rg32i;
1243
case glslang::ElfRg16i: return spv::ImageFormat::Rg16i;
1244
case glslang::ElfRg8i: return spv::ImageFormat::Rg8i;
1245
case glslang::ElfR16i: return spv::ImageFormat::R16i;
1246
case glslang::ElfR8i: return spv::ImageFormat::R8i;
1247
case glslang::ElfRgba32ui: return spv::ImageFormat::Rgba32ui;
1248
case glslang::ElfRgba16ui: return spv::ImageFormat::Rgba16ui;
1249
case glslang::ElfRgba8ui: return spv::ImageFormat::Rgba8ui;
1250
case glslang::ElfR32ui: return spv::ImageFormat::R32ui;
1251
case glslang::ElfRg32ui: return spv::ImageFormat::Rg32ui;
1252
case glslang::ElfRg16ui: return spv::ImageFormat::Rg16ui;
1253
case glslang::ElfRgb10a2ui: return spv::ImageFormat::Rgb10a2ui;
1254
case glslang::ElfRg8ui: return spv::ImageFormat::Rg8ui;
1255
case glslang::ElfR16ui: return spv::ImageFormat::R16ui;
1256
case glslang::ElfR8ui: return spv::ImageFormat::R8ui;
1257
case glslang::ElfR64ui: return spv::ImageFormat::R64ui;
1258
case glslang::ElfR64i: return spv::ImageFormat::R64i;
1259
default: return spv::ImageFormat::Max;
1260
}
1261
}
1262
1263
// Turn the flatten / don't-flatten hints stored on a selection node into a
// SPIR-V selection control mask. The flatten hint is checked first, so it
// takes precedence if both are set; with neither set the mask is MaskNone.
spv::SelectionControlMask TGlslangToSpvTraverser::TranslateSelectionControl(
    const glslang::TIntermSelection& selectionNode) const
{
    if (selectionNode.getFlatten())
        return spv::SelectionControlMask::Flatten;

    return selectionNode.getDontFlatten() ? spv::SelectionControlMask::DontFlatten
                                          : spv::SelectionControlMask::MaskNone;
}
1272
1273
// Turn the flatten / don't-flatten hints stored on a switch node into a
// SPIR-V selection control mask. The flatten hint is checked first; when
// neither hint is set the result is MaskNone.
spv::SelectionControlMask TGlslangToSpvTraverser::TranslateSwitchControl(const glslang::TIntermSwitch& switchNode)
    const
{
    spv::SelectionControlMask control = spv::SelectionControlMask::MaskNone;

    if (switchNode.getFlatten()) {
        control = spv::SelectionControlMask::Flatten;
    } else if (switchNode.getDontFlatten()) {
        control = spv::SelectionControlMask::DontFlatten;
    }

    return control;
}
1282
1283
// return a non-0 dependency if the dependency argument must be set
1284
spv::LoopControlMask TGlslangToSpvTraverser::TranslateLoopControl(const glslang::TIntermLoop& loopNode,
1285
std::vector<unsigned int>& operands) const
1286
{
1287
spv::LoopControlMask control = spv::LoopControlMask::MaskNone;
1288
1289
if (loopNode.getDontUnroll())
1290
control = control | spv::LoopControlMask::DontUnroll;
1291
if (loopNode.getUnroll())
1292
control = control | spv::LoopControlMask::Unroll;
1293
if (unsigned(loopNode.getLoopDependency()) == glslang::TIntermLoop::dependencyInfinite)
1294
control = control | spv::LoopControlMask::DependencyInfinite;
1295
else if (loopNode.getLoopDependency() > 0) {
1296
control = control | spv::LoopControlMask::DependencyLength;
1297
operands.push_back((unsigned int)loopNode.getLoopDependency());
1298
}
1299
if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4) {
1300
if (loopNode.getMinIterations() > 0) {
1301
control = control | spv::LoopControlMask::MinIterations;
1302
operands.push_back(loopNode.getMinIterations());
1303
}
1304
if (loopNode.getMaxIterations() < glslang::TIntermLoop::iterationsInfinite) {
1305
control = control | spv::LoopControlMask::MaxIterations;
1306
operands.push_back(loopNode.getMaxIterations());
1307
}
1308
if (loopNode.getIterationMultiple() > 1) {
1309
control = control | spv::LoopControlMask::IterationMultiple;
1310
operands.push_back(loopNode.getIterationMultiple());
1311
}
1312
if (loopNode.getPeelCount() > 0) {
1313
control = control | spv::LoopControlMask::PeelCount;
1314
operands.push_back(loopNode.getPeelCount());
1315
}
1316
if (loopNode.getPartialCount() > 0) {
1317
control = control | spv::LoopControlMask::PartialCount;
1318
operands.push_back(loopNode.getPartialCount());
1319
}
1320
}
1321
1322
return control;
1323
}
1324
1325
// Translate glslang type to SPIR-V storage class.
1326
spv::StorageClass TGlslangToSpvTraverser::TranslateStorageClass(const glslang::TType& type)
1327
{
1328
if (type.getBasicType() == glslang::EbtRayQuery || type.getBasicType() == glslang::EbtHitObjectNV
1329
|| type.getBasicType() == glslang::EbtHitObjectEXT)
1330
return spv::StorageClass::Private;
1331
if (type.getQualifier().isSpirvByReference()) {
1332
if (type.getQualifier().isParamInput() || type.getQualifier().isParamOutput())
1333
return spv::StorageClass::Function;
1334
}
1335
if (type.getQualifier().isPipeInput())
1336
return spv::StorageClass::Input;
1337
if (type.getQualifier().isPipeOutput())
1338
return spv::StorageClass::Output;
1339
if (type.getQualifier().storage == glslang::EvqTileImageEXT || type.isAttachmentEXT()) {
1340
builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
1341
builder.addCapability(spv::Capability::TileImageColorReadAccessEXT);
1342
return spv::StorageClass::TileImageEXT;
1343
}
1344
1345
if (type.getQualifier().isTileAttachmentQCOM()) {
1346
builder.addExtension(spv::E_SPV_QCOM_tile_shading);
1347
builder.addCapability(spv::Capability::TileShadingQCOM);
1348
return spv::StorageClass::TileAttachmentQCOM;
1349
}
1350
1351
if (glslangIntermediate->getSource() != glslang::EShSourceHlsl ||
1352
type.getQualifier().storage == glslang::EvqUniform) {
1353
if (type.isAtomic())
1354
return spv::StorageClass::AtomicCounter;
1355
if (type.containsOpaque() && !glslangIntermediate->getBindlessMode())
1356
return spv::StorageClass::UniformConstant;
1357
}
1358
1359
if (type.getQualifier().isUniformOrBuffer() &&
1360
type.getQualifier().isShaderRecord()) {
1361
return spv::StorageClass::ShaderRecordBufferKHR;
1362
}
1363
1364
if (glslangIntermediate->usingStorageBuffer() && type.getQualifier().storage == glslang::EvqBuffer) {
1365
builder.addIncorporatedExtension(spv::E_SPV_KHR_storage_buffer_storage_class, spv::Spv_1_3);
1366
return spv::StorageClass::StorageBuffer;
1367
}
1368
1369
if (type.getQualifier().isUniformOrBuffer()) {
1370
if (type.getQualifier().isPushConstant())
1371
return spv::StorageClass::PushConstant;
1372
if (type.getBasicType() == glslang::EbtBlock)
1373
return spv::StorageClass::Uniform;
1374
return spv::StorageClass::UniformConstant;
1375
}
1376
1377
if (type.getQualifier().storage == glslang::EvqShared && type.getBasicType() == glslang::EbtBlock) {
1378
builder.addExtension(spv::E_SPV_KHR_workgroup_memory_explicit_layout);
1379
builder.addCapability(spv::Capability::WorkgroupMemoryExplicitLayoutKHR);
1380
return spv::StorageClass::Workgroup;
1381
}
1382
1383
switch (type.getQualifier().storage) {
1384
case glslang::EvqGlobal: return spv::StorageClass::Private;
1385
case glslang::EvqConstReadOnly: return spv::StorageClass::Function;
1386
case glslang::EvqTemporary: return spv::StorageClass::Function;
1387
case glslang::EvqShared: return spv::StorageClass::Workgroup;
1388
case glslang::EvqPayload: return spv::StorageClass::RayPayloadKHR;
1389
case glslang::EvqPayloadIn: return spv::StorageClass::IncomingRayPayloadKHR;
1390
case glslang::EvqHitAttr: return spv::StorageClass::HitAttributeKHR;
1391
case glslang::EvqCallableData: return spv::StorageClass::CallableDataKHR;
1392
case glslang::EvqCallableDataIn: return spv::StorageClass::IncomingCallableDataKHR;
1393
case glslang::EvqtaskPayloadSharedEXT : return spv::StorageClass::TaskPayloadWorkgroupEXT;
1394
case glslang::EvqHitObjectAttrNV: return spv::StorageClass::HitObjectAttributeNV;
1395
case glslang::EvqHitObjectAttrEXT: return spv::StorageClass::HitObjectAttributeEXT;
1396
case glslang::EvqSpirvStorageClass: return static_cast<spv::StorageClass>(type.getQualifier().spirvStorageClass);
1397
default:
1398
assert(0);
1399
break;
1400
}
1401
1402
return spv::StorageClass::Function;
1403
}
1404
1405
// Translate glslang constants to SPIR-V literals
1406
void TGlslangToSpvTraverser::TranslateLiterals(const glslang::TVector<const glslang::TIntermConstantUnion*>& constants,
1407
std::vector<unsigned>& literals) const
1408
{
1409
for (auto constant : constants) {
1410
if (constant->getBasicType() == glslang::EbtFloat) {
1411
float floatValue = static_cast<float>(constant->getConstArray()[0].getDConst());
1412
unsigned literal;
1413
static_assert(sizeof(literal) == sizeof(floatValue), "sizeof(unsigned) != sizeof(float)");
1414
memcpy(&literal, &floatValue, sizeof(literal));
1415
literals.push_back(literal);
1416
} else if (constant->getBasicType() == glslang::EbtInt) {
1417
unsigned literal = constant->getConstArray()[0].getIConst();
1418
literals.push_back(literal);
1419
} else if (constant->getBasicType() == glslang::EbtUint) {
1420
unsigned literal = constant->getConstArray()[0].getUConst();
1421
literals.push_back(literal);
1422
} else if (constant->getBasicType() == glslang::EbtBool) {
1423
unsigned literal = constant->getConstArray()[0].getBConst();
1424
literals.push_back(literal);
1425
} else if (constant->getBasicType() == glslang::EbtString) {
1426
auto str = constant->getConstArray()[0].getSConst()->c_str();
1427
unsigned literal = 0;
1428
char* literalPtr = reinterpret_cast<char*>(&literal);
1429
unsigned charCount = 0;
1430
char ch = 0;
1431
do {
1432
ch = *(str++);
1433
*(literalPtr++) = ch;
1434
++charCount;
1435
if (charCount == 4) {
1436
literals.push_back(literal);
1437
literalPtr = reinterpret_cast<char*>(&literal);
1438
charCount = 0;
1439
}
1440
} while (ch != 0);
1441
1442
// Partial literal is padded with 0
1443
if (charCount > 0) {
1444
for (; charCount < 4; ++charCount)
1445
*(literalPtr++) = 0;
1446
literals.push_back(literal);
1447
}
1448
} else
1449
assert(0); // Unexpected type
1450
}
1451
}
1452
1453
// Add capabilities pertaining to how an array is indexed.
1454
void TGlslangToSpvTraverser::addIndirectionIndexCapabilities(const glslang::TType& baseType,
1455
const glslang::TType& indexType)
1456
{
1457
if (indexType.getQualifier().isNonUniform()) {
1458
// deal with an asserted non-uniform index
1459
// SPV_EXT_descriptor_indexing already added in TranslateNonUniformDecoration
1460
if (baseType.getBasicType() == glslang::EbtSampler) {
1461
if (baseType.getQualifier().hasAttachment())
1462
builder.addCapability(spv::Capability::InputAttachmentArrayNonUniformIndexingEXT);
1463
else if (baseType.isImage() && baseType.getSampler().isBuffer())
1464
builder.addCapability(spv::Capability::StorageTexelBufferArrayNonUniformIndexingEXT);
1465
else if (baseType.isTexture() && baseType.getSampler().isBuffer())
1466
builder.addCapability(spv::Capability::UniformTexelBufferArrayNonUniformIndexingEXT);
1467
else if (baseType.isImage())
1468
builder.addCapability(spv::Capability::StorageImageArrayNonUniformIndexingEXT);
1469
else if (baseType.isTexture())
1470
builder.addCapability(spv::Capability::SampledImageArrayNonUniformIndexingEXT);
1471
} else if (baseType.getBasicType() == glslang::EbtBlock) {
1472
if (baseType.getQualifier().storage == glslang::EvqBuffer)
1473
builder.addCapability(spv::Capability::StorageBufferArrayNonUniformIndexingEXT);
1474
else if (baseType.getQualifier().storage == glslang::EvqUniform)
1475
builder.addCapability(spv::Capability::UniformBufferArrayNonUniformIndexingEXT);
1476
}
1477
} else {
1478
// assume a dynamically uniform index
1479
if (baseType.getBasicType() == glslang::EbtSampler) {
1480
if (baseType.getQualifier().hasAttachment()) {
1481
builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);
1482
builder.addCapability(spv::Capability::InputAttachmentArrayDynamicIndexingEXT);
1483
} else if (baseType.isImage() && baseType.getSampler().isBuffer()) {
1484
builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);
1485
builder.addCapability(spv::Capability::StorageTexelBufferArrayDynamicIndexingEXT);
1486
} else if (baseType.isTexture() && baseType.getSampler().isBuffer()) {
1487
builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);
1488
builder.addCapability(spv::Capability::UniformTexelBufferArrayDynamicIndexingEXT);
1489
}
1490
}
1491
}
1492
}
1493
1494
// Return whether or not the given type is something that should be tied to a
1495
// descriptor set.
1496
bool IsDescriptorResource(const glslang::TType& type)
1497
{
1498
// uniform and buffer blocks are included, unless it is a push_constant
1499
if (type.getBasicType() == glslang::EbtBlock)
1500
return type.getQualifier().isUniformOrBuffer() &&
1501
! type.getQualifier().isShaderRecord() &&
1502
! type.getQualifier().isPushConstant();
1503
1504
// non block...
1505
// basically samplerXXX/subpass/sampler/texture are all included
1506
// if they are the global-scope-class, not the function parameter
1507
// (or local, if they ever exist) class.
1508
if (type.getBasicType() == glslang::EbtSampler ||
1509
type.getBasicType() == glslang::EbtAccStruct)
1510
return type.getQualifier().isUniformOrBuffer();
1511
1512
// Tensors are tied to a descriptor.
1513
if (type.isTensorARM())
1514
return true;
1515
1516
// None of the above.
1517
return false;
1518
}
1519
1520
// Propagate qualifiers from 'parent' into 'child'.
//
// - The matrix layout is taken from the parent only when the child has none.
// - Each boolean qualifier below becomes set on the child if it is set on the
//   parent; a flag already set on the child is never cleared.
// - The storage qualifier is overwritten only for task-payload storage.
void InheritQualifiers(glslang::TQualifier& child, const glslang::TQualifier& parent)
{
    if (child.layoutMatrix == glslang::ElmNone)
        child.layoutMatrix = parent.layoutMatrix;

    // invariance and interpolation
    child.invariant      = child.invariant      || parent.invariant;
    child.flat           = child.flat           || parent.flat;
    child.centroid       = child.centroid       || parent.centroid;
    child.nopersp        = child.nopersp        || parent.nopersp;
    child.explicitInterp = child.explicitInterp || parent.explicitInterp;

    // mesh/task related
    child.perPrimitiveNV = child.perPrimitiveNV || parent.perPrimitiveNV;
    child.perViewNV      = child.perViewNV      || parent.perViewNV;
    child.perTaskNV      = child.perTaskNV      || parent.perTaskNV;
    if (parent.storage == glslang::EvqtaskPayloadSharedEXT)
        child.storage = glslang::EvqtaskPayloadSharedEXT;

    // auxiliary storage
    child.patch  = child.patch  || parent.patch;
    child.sample = child.sample || parent.sample;

    // memory qualifiers
    child.coherent            = child.coherent            || parent.coherent;
    child.devicecoherent      = child.devicecoherent      || parent.devicecoherent;
    child.queuefamilycoherent = child.queuefamilycoherent || parent.queuefamilycoherent;
    child.workgroupcoherent   = child.workgroupcoherent   || parent.workgroupcoherent;
    child.subgroupcoherent    = child.subgroupcoherent    || parent.subgroupcoherent;
    child.shadercallcoherent  = child.shadercallcoherent  || parent.shadercallcoherent;
    child.nonprivate          = child.nonprivate          || parent.nonprivate;
    child.volatil             = child.volatil             || parent.volatil;
    child.nontemporal         = child.nontemporal         || parent.nontemporal;
    child.restrict            = child.restrict            || parent.restrict;
    child.readonly            = child.readonly            || parent.readonly;
    child.writeonly           = child.writeonly           || parent.writeonly;

    child.nonUniform = child.nonUniform || parent.nonUniform;
}
1574
1575
// Report whether 'qualifier' carries a qualifier that simultaneously satisfies
// all of:
//  - struct members might inherit it from a struct declaration
//    (note that non-block structs don't explicitly inherit,
//    only implicitly, meaning no decoration involved)
//  - it affects decorations on the struct members
//    (note smooth does not, and something like volatile is expected
//    to affect the whole object)
//  - it is not part of the offset/std430/etc or row/column-major layout
//
// Currently that is 'invariant', or a location on a block type.
bool HasNonLayoutQualifiers(const glslang::TType& type, const glslang::TQualifier& qualifier)
{
    if (qualifier.invariant)
        return true;

    if (!qualifier.hasLocation())
        return false;

    return type.getBasicType() == glslang::EbtBlock;
}
1587
1588
//
1589
// Implement the TGlslangToSpvTraverser class.
1590
//
1591
1592
// Construct the traverser and emit everything that can be decided before the
// AST is walked.
//
//  spvVersion          - passed to the SPIR-V builder
//  glslangIntermediate - the intermediate representation being translated
//  buildLogger         - logger handed to the builder
//  options             - translation options; the debug-info flags in it may
//                        be switched on here (see below)
//
// In order, this sets the source language and optional debug information, the
// addressing and memory models, the entry point (unless compiling only), the
// source extensions, the top-level and per-stage execution modes with their
// capabilities/extensions, and finally the GL_EXT_spirv_intrinsics
// requirements and execution modes.
TGlslangToSpvTraverser::TGlslangToSpvTraverser(unsigned int spvVersion,
    const glslang::TIntermediate* glslangIntermediate,
    spv::SpvBuildLogger* buildLogger, glslang::SpvOptions& options) :
        TIntermTraverser(true, false, true),
        options(options),
        shaderEntry(nullptr), currentFunction(nullptr),
        sequenceDepth(0), logger(buildLogger),
        builder(spvVersion, (glslang::GetKhronosToolId() << 16) | glslang::GetSpirvGeneratorVersion(), logger),
        inEntryPoint(false), entryPointTerminated(false), linkageOnly(false),
        glslangIntermediate(glslangIntermediate),
        nanMinMaxClamp(glslangIntermediate->getNanMinMaxClamp()),
        nonSemanticDebugPrintf(0),
        taskPayloadID(0)
{
    bool isMeshShaderExt = (glslangIntermediate->getRequestedExtensions().find(glslang::E_GL_EXT_mesh_shader) !=
                            glslangIntermediate->getRequestedExtensions().end());
    spv::ExecutionModel executionModel = TranslateExecutionModel(glslangIntermediate->getStage(), isMeshShaderExt);

    builder.clearAccessChain();
    builder.setSource(TranslateSourceLanguage(glslangIntermediate->getSource(), glslangIntermediate->getProfile()),
                      glslangIntermediate->getVersion());

    // The debug options imply each other: debug source => non-semantic debug
    // info => generic debug info.
    if (options.emitNonSemanticShaderDebugSource)
        this->options.emitNonSemanticShaderDebugInfo = true;
    if (options.emitNonSemanticShaderDebugInfo)
        this->options.generateDebugInfo = true;

    if (this->options.generateDebugInfo) {
        if (this->options.emitNonSemanticShaderDebugInfo) {
            builder.setEmitNonSemanticShaderDebugInfo(this->options.emitNonSemanticShaderDebugSource);
        }
        else {
            builder.setEmitSpirvDebugInfo();
        }
        builder.setDebugMainSourceFile(glslangIntermediate->getSourceFile());

        // Set the source shader's text. If for SPV version 1.0, include
        // a preamble in comments stating the OpModuleProcessed instructions.
        // Otherwise, emit those as actual instructions.
        std::string text;
        const std::vector<std::string>& processes = glslangIntermediate->getProcesses();
        const bool processesAsComments = glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_1;
        for (const std::string& process : processes) {
            if (processesAsComments) {
                text.append("// OpModuleProcessed ");
                text.append(process);
                text.append("\n");
            } else
                builder.addModuleProcessed(process);
        }
        // Keep line numbers of the real source intact after the comment preamble.
        if (processesAsComments && !processes.empty())
            text.append("#line 1\n");
        text.append(glslangIntermediate->getSourceText());
        builder.setSourceText(text);
        // Pass name and text for all included files
        const std::map<std::string, std::string>& include_txt = glslangIntermediate->getIncludeText();
        for (const auto& include : include_txt)
            builder.addInclude(include.first, include.second);
    }

    builder.setUseReplicatedComposites(glslangIntermediate->usingReplicatedComposites());

    stdBuiltins = builder.import("GLSL.std.450");

    spv::AddressingModel addressingModel = spv::AddressingModel::Logical;
    spv::MemoryModel memoryModel = spv::MemoryModel::GLSL450;

    if (glslangIntermediate->usingPhysicalStorageBuffer()) {
        addressingModel = spv::AddressingModel::PhysicalStorageBuffer64EXT;
        builder.addIncorporatedExtension(spv::E_SPV_KHR_physical_storage_buffer, spv::Spv_1_5);
        builder.addCapability(spv::Capability::PhysicalStorageBufferAddressesEXT);
    }
    if (glslangIntermediate->usingVulkanMemoryModel()) {
        memoryModel = spv::MemoryModel::VulkanKHR;
        builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
        builder.addIncorporatedExtension(spv::E_SPV_KHR_vulkan_memory_model, spv::Spv_1_5);
    }
    builder.setMemoryModel(addressingModel, memoryModel);

    if (glslangIntermediate->usingVariablePointers()) {
        builder.addCapability(spv::Capability::VariablePointers);
    }

    // If not linking, there is no entry point
    // (shaderEntry then stays nullptr and is still passed to the execution-mode
    // calls below. NOTE(review): presumably the builder tolerates a null entry
    // point - confirm.)
    if (!options.compileOnly) {
        shaderEntry = builder.makeEntryPoint(glslangIntermediate->getEntryPointName().c_str());
        entryPoint =
            builder.addEntryPoint(executionModel, shaderEntry, glslangIntermediate->getEntryPointName().c_str());
    }

    // Add the source extensions
    const auto& sourceExtensions = glslangIntermediate->getRequestedExtensions();
    for (auto it = sourceExtensions.begin(); it != sourceExtensions.end(); ++it)
        builder.addSourceExtension(it->c_str());

    // Add the top-level modes for this shader.

    if (glslangIntermediate->getXfbMode()) {
        builder.addCapability(spv::Capability::TransformFeedback);
        builder.addExecutionMode(shaderEntry, spv::ExecutionMode::Xfb);
    }

    if (glslangIntermediate->getLayoutPrimitiveCulling()) {
        builder.addCapability(spv::Capability::RayTraversalPrimitiveCullingKHR);
    }

    if (glslangIntermediate->getSubgroupUniformControlFlow()) {
        builder.addExtension(spv::E_SPV_KHR_subgroup_uniform_control_flow);
        builder.addExecutionMode(shaderEntry, spv::ExecutionMode::SubgroupUniformControlFlowKHR);
    }
    if (glslangIntermediate->getMaximallyReconverges()) {
        builder.addExtension(spv::E_SPV_KHR_maximal_reconvergence);
        builder.addExecutionMode(shaderEntry, spv::ExecutionMode::MaximallyReconvergesKHR);
    }

    if (glslangIntermediate->getQuadDerivMode())
    {
        builder.addCapability(spv::Capability::QuadControlKHR);
        builder.addExtension(spv::E_SPV_KHR_quad_control);
        builder.addExecutionMode(shaderEntry, spv::ExecutionMode::QuadDerivativesKHR);
    }

    if (glslangIntermediate->getReqFullQuadsMode())
    {
        builder.addCapability(spv::Capability::QuadControlKHR);
        builder.addExtension(spv::E_SPV_KHR_quad_control);
        builder.addExecutionMode(shaderEntry, spv::ExecutionMode::RequireFullQuadsKHR);
    }

    if (glslangIntermediate->usingShader64BitIndexing())
    {
        builder.addCapability(spv::Capability::Shader64BitIndexingEXT);
        builder.addExtension(spv::E_SPV_EXT_shader_64bit_indexing);
        builder.addExecutionMode(shaderEntry, spv::ExecutionMode::Shader64BitIndexingEXT);
    }

    // Per-stage modes. 'mode' is scratch storage: each inner switch maps a
    // layout setting to an execution mode, with Max meaning "nothing to add".
    spv::ExecutionMode mode;
    switch (glslangIntermediate->getStage()) {
    case EShLangVertex:
        builder.addCapability(spv::Capability::Shader);
        break;

    case EShLangFragment:
        builder.addCapability(spv::Capability::Shader);
        if (glslangIntermediate->getPixelCenterInteger())
            builder.addExecutionMode(shaderEntry, spv::ExecutionMode::PixelCenterInteger);

        if (glslangIntermediate->getOriginUpperLeft())
            builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OriginUpperLeft);
        else
            builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OriginLowerLeft);

        if (glslangIntermediate->getEarlyFragmentTests())
            builder.addExecutionMode(shaderEntry, spv::ExecutionMode::EarlyFragmentTests);

        if (glslangIntermediate->getEarlyAndLateFragmentTestsAMD())
        {
            builder.addExecutionMode(shaderEntry, spv::ExecutionMode::EarlyAndLateFragmentTestsAMD);
            builder.addExtension(spv::E_SPV_AMD_shader_early_and_late_fragment_tests);
        }

        if (glslangIntermediate->getPostDepthCoverage()) {
            builder.addCapability(spv::Capability::SampleMaskPostDepthCoverage);
            builder.addExecutionMode(shaderEntry, spv::ExecutionMode::PostDepthCoverage);
            builder.addExtension(spv::E_SPV_KHR_post_depth_coverage);
        }

        if (glslangIntermediate->getNonCoherentColorAttachmentReadEXT()) {
            builder.addCapability(spv::Capability::TileImageColorReadAccessEXT);
            builder.addExecutionMode(shaderEntry, spv::ExecutionMode::NonCoherentColorAttachmentReadEXT);
            builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
        }

        if (glslangIntermediate->getNonCoherentDepthAttachmentReadEXT()) {
            builder.addCapability(spv::Capability::TileImageDepthReadAccessEXT);
            builder.addExecutionMode(shaderEntry, spv::ExecutionMode::NonCoherentDepthAttachmentReadEXT);
            builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
        }

        if (glslangIntermediate->getNonCoherentStencilAttachmentReadEXT()) {
            builder.addCapability(spv::Capability::TileImageStencilReadAccessEXT);
            builder.addExecutionMode(shaderEntry, spv::ExecutionMode::NonCoherentStencilAttachmentReadEXT);
            builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
        }

        if (glslangIntermediate->getNonCoherentTileAttachmentReadQCOM()) {
            builder.addCapability(spv::Capability::TileShadingQCOM);
            builder.addExecutionMode(shaderEntry, spv::ExecutionMode::NonCoherentTileAttachmentReadQCOM);
            builder.addExtension(spv::E_SPV_QCOM_tile_shading);
        }

        if (glslangIntermediate->isDepthReplacing())
            builder.addExecutionMode(shaderEntry, spv::ExecutionMode::DepthReplacing);

        if (glslangIntermediate->isStencilReplacing())
            builder.addExecutionMode(shaderEntry, spv::ExecutionMode::StencilRefReplacingEXT);

        switch(glslangIntermediate->getDepth()) {
        case glslang::EldGreater:   mode = spv::ExecutionMode::DepthGreater;   break;
        case glslang::EldLess:      mode = spv::ExecutionMode::DepthLess;      break;
        case glslang::EldUnchanged: mode = spv::ExecutionMode::DepthUnchanged; break;
        default:                    mode = spv::ExecutionMode::Max;            break;
        }

        if (mode != spv::ExecutionMode::Max)
            builder.addExecutionMode(shaderEntry, mode);

        switch (glslangIntermediate->getStencil()) {
        case glslang::ElsRefUnchangedFrontAMD:  mode = spv::ExecutionMode::StencilRefUnchangedFrontAMD; break;
        case glslang::ElsRefGreaterFrontAMD:    mode = spv::ExecutionMode::StencilRefGreaterFrontAMD;   break;
        case glslang::ElsRefLessFrontAMD:       mode = spv::ExecutionMode::StencilRefLessFrontAMD;      break;
        case glslang::ElsRefUnchangedBackAMD:   mode = spv::ExecutionMode::StencilRefUnchangedBackAMD;  break;
        case glslang::ElsRefGreaterBackAMD:     mode = spv::ExecutionMode::StencilRefGreaterBackAMD;    break;
        case glslang::ElsRefLessBackAMD:        mode = spv::ExecutionMode::StencilRefLessBackAMD;       break;
        default:                                mode = spv::ExecutionMode::Max;                         break;
        }

        if (mode != spv::ExecutionMode::Max)
            builder.addExecutionMode(shaderEntry, mode);
        switch (glslangIntermediate->getInterlockOrdering()) {
        case glslang::EioPixelInterlockOrdered:         mode = spv::ExecutionMode::PixelInterlockOrderedEXT;
            break;
        case glslang::EioPixelInterlockUnordered:       mode = spv::ExecutionMode::PixelInterlockUnorderedEXT;
            break;
        case glslang::EioSampleInterlockOrdered:        mode = spv::ExecutionMode::SampleInterlockOrderedEXT;
            break;
        case glslang::EioSampleInterlockUnordered:      mode = spv::ExecutionMode::SampleInterlockUnorderedEXT;
            break;
        case glslang::EioShadingRateInterlockOrdered:   mode = spv::ExecutionMode::ShadingRateInterlockOrderedEXT;
            break;
        case glslang::EioShadingRateInterlockUnordered: mode = spv::ExecutionMode::ShadingRateInterlockUnorderedEXT;
            break;
        default:                                        mode = spv::ExecutionMode::Max;
            break;
        }
        if (mode != spv::ExecutionMode::Max) {
            builder.addExecutionMode(shaderEntry, mode);
            // The capability depends on which family of interlock was requested.
            if (mode == spv::ExecutionMode::ShadingRateInterlockOrderedEXT ||
                mode == spv::ExecutionMode::ShadingRateInterlockUnorderedEXT) {
                builder.addCapability(spv::Capability::FragmentShaderShadingRateInterlockEXT);
            } else if (mode == spv::ExecutionMode::PixelInterlockOrderedEXT ||
                       mode == spv::ExecutionMode::PixelInterlockUnorderedEXT) {
                builder.addCapability(spv::Capability::FragmentShaderPixelInterlockEXT);
            } else {
                builder.addCapability(spv::Capability::FragmentShaderSampleInterlockEXT);
            }
            builder.addExtension(spv::E_SPV_EXT_fragment_shader_interlock);
        }
    break;

    case EShLangCompute: {
        builder.addCapability(spv::Capability::Shader);
        // LocalSizeId is only needed when some dimension is a specialization constant.
        bool needSizeId = false;
        for (int dim = 0; dim < 3; ++dim) {
            if ((glslangIntermediate->getLocalSizeSpecId(dim) != glslang::TQualifier::layoutNotSet)) {
                needSizeId = true;
                break;
            }
        }
        if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6 && needSizeId) {
            std::vector<spv::Id> dimConstId;
            for (int dim = 0; dim < 3; ++dim) {
                bool specConst = (glslangIntermediate->getLocalSizeSpecId(dim) != glslang::TQualifier::layoutNotSet);
                dimConstId.push_back(builder.makeUintConstant(glslangIntermediate->getLocalSize(dim), specConst));
                if (specConst) {
                    builder.addDecoration(dimConstId.back(), spv::Decoration::SpecId,
                                          glslangIntermediate->getLocalSizeSpecId(dim));
                }
            }
            builder.addExecutionModeId(shaderEntry, spv::ExecutionMode::LocalSizeId, dimConstId);
        } else {
            if (glslangIntermediate->getTileShadingRateQCOM(0) >= 1 || glslangIntermediate->getTileShadingRateQCOM(1) >= 1 || glslangIntermediate->getTileShadingRateQCOM(2) >= 1) {
                auto rate_x = glslangIntermediate->getTileShadingRateQCOM(0);
                auto rate_y = glslangIntermediate->getTileShadingRateQCOM(1);
                auto rate_z = glslangIntermediate->getTileShadingRateQCOM(2);
                // A rate of 0 is emitted as 1.
                rate_x = ( rate_x == 0 ? 1 : rate_x );
                rate_y = ( rate_y == 0 ? 1 : rate_y );
                rate_z = ( rate_z == 0 ? 1 : rate_z );
                builder.addExecutionMode(shaderEntry, spv::ExecutionMode::TileShadingRateQCOM, rate_x, rate_y, rate_z);
            } else {
                builder.addExecutionMode(shaderEntry, spv::ExecutionMode::LocalSize, glslangIntermediate->getLocalSize(0),
                                                                                     glslangIntermediate->getLocalSize(1),
                                                                                     glslangIntermediate->getLocalSize(2));
            }
        }
        if (glslangIntermediate->getLayoutDerivativeModeNone() == glslang::LayoutDerivativeGroupQuads) {
            builder.addCapability(spv::Capability::ComputeDerivativeGroupQuadsNV);
            builder.addExecutionMode(shaderEntry, spv::ExecutionMode::DerivativeGroupQuadsNV);
            builder.addExtension(spv::E_SPV_NV_compute_shader_derivatives);
        } else if (glslangIntermediate->getLayoutDerivativeModeNone() == glslang::LayoutDerivativeGroupLinear) {
            builder.addCapability(spv::Capability::ComputeDerivativeGroupLinearNV);
            builder.addExecutionMode(shaderEntry, spv::ExecutionMode::DerivativeGroupLinearNV);
            builder.addExtension(spv::E_SPV_NV_compute_shader_derivatives);
        }

        if (glslangIntermediate->getNonCoherentTileAttachmentReadQCOM()) {
            builder.addCapability(spv::Capability::TileShadingQCOM);
            builder.addExecutionMode(shaderEntry, spv::ExecutionMode::NonCoherentTileAttachmentReadQCOM);
            builder.addExtension(spv::E_SPV_QCOM_tile_shading);
        }

        break;
    }
    case EShLangTessEvaluation:
    case EShLangTessControl:
        builder.addCapability(spv::Capability::Tessellation);

        glslang::TLayoutGeometry primitive;

        // Control shaders read the primitive from the output layout,
        // evaluation shaders from the input layout.
        if (glslangIntermediate->getStage() == EShLangTessControl) {
            builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OutputVertices,
                glslangIntermediate->getVertices());
            primitive = glslangIntermediate->getOutputPrimitive();
        } else {
            primitive = glslangIntermediate->getInputPrimitive();
        }

        switch (primitive) {
        case glslang::ElgTriangles:           mode = spv::ExecutionMode::Triangles;     break;
        case glslang::ElgQuads:               mode = spv::ExecutionMode::Quads;         break;
        case glslang::ElgIsolines:            mode = spv::ExecutionMode::Isolines;      break;
        default:                              mode = spv::ExecutionMode::Max;           break;
        }
        if (mode != spv::ExecutionMode::Max)
            builder.addExecutionMode(shaderEntry, mode);

        switch (glslangIntermediate->getVertexSpacing()) {
        case glslang::EvsEqual:            mode = spv::ExecutionMode::SpacingEqual;          break;
        case glslang::EvsFractionalEven:   mode = spv::ExecutionMode::SpacingFractionalEven; break;
        case glslang::EvsFractionalOdd:    mode = spv::ExecutionMode::SpacingFractionalOdd;  break;
        default:                           mode = spv::ExecutionMode::Max;                   break;
        }
        if (mode != spv::ExecutionMode::Max)
            builder.addExecutionMode(shaderEntry, mode);

        switch (glslangIntermediate->getVertexOrder()) {
        case glslang::EvoCw:     mode = spv::ExecutionMode::VertexOrderCw;  break;
        case glslang::EvoCcw:    mode = spv::ExecutionMode::VertexOrderCcw; break;
        default:                 mode = spv::ExecutionMode::Max;            break;
        }
        if (mode != spv::ExecutionMode::Max)
            builder.addExecutionMode(shaderEntry, mode);

        if (glslangIntermediate->getPointMode())
            builder.addExecutionMode(shaderEntry, spv::ExecutionMode::PointMode);
        break;

    case EShLangGeometry:
        builder.addCapability(spv::Capability::Geometry);
        switch (glslangIntermediate->getInputPrimitive()) {
        case glslang::ElgPoints:             mode = spv::ExecutionMode::InputPoints;             break;
        case glslang::ElgLines:              mode = spv::ExecutionMode::InputLines;              break;
        case glslang::ElgLinesAdjacency:     mode = spv::ExecutionMode::InputLinesAdjacency;     break;
        case glslang::ElgTriangles:          mode = spv::ExecutionMode::Triangles;               break;
        case glslang::ElgTrianglesAdjacency: mode = spv::ExecutionMode::InputTrianglesAdjacency; break;
        default:                             mode = spv::ExecutionMode::Max;                     break;
        }
        if (mode != spv::ExecutionMode::Max)
            builder.addExecutionMode(shaderEntry, mode);

        builder.addExecutionMode(shaderEntry, spv::ExecutionMode::Invocations, glslangIntermediate->getInvocations());

        switch (glslangIntermediate->getOutputPrimitive()) {
        case glslang::ElgPoints:        mode = spv::ExecutionMode::OutputPoints;        break;
        case glslang::ElgLineStrip:     mode = spv::ExecutionMode::OutputLineStrip;     break;
        case glslang::ElgTriangleStrip: mode = spv::ExecutionMode::OutputTriangleStrip; break;
        default:                        mode = spv::ExecutionMode::Max;                 break;
        }
        if (mode != spv::ExecutionMode::Max)
            builder.addExecutionMode(shaderEntry, mode);
        builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OutputVertices, glslangIntermediate->getVertices());
        break;

    case EShLangRayGen:
    case EShLangIntersect:
    case EShLangAnyHit:
    case EShLangClosestHit:
    case EShLangMiss:
    case EShLangCallable:
    {
        auto& extensions = glslangIntermediate->getRequestedExtensions();
        if (extensions.find("GL_EXT_opacity_micromap") != extensions.end()) {
            builder.addCapability(spv::Capability::RayTracingOpacityMicromapEXT);
            builder.addExtension("SPV_EXT_opacity_micromap");
        }
        // The KHR flavor is used unless the shader asked for GL_NV_ray_tracing.
        if (extensions.find("GL_NV_ray_tracing") == extensions.end()) {
            builder.addCapability(spv::Capability::RayTracingKHR);
            builder.addExtension("SPV_KHR_ray_tracing");
        }
        else {
            builder.addCapability(spv::Capability::RayTracingNV);
            builder.addExtension("SPV_NV_ray_tracing");
        }
        if (glslangIntermediate->getStage() != EShLangRayGen && glslangIntermediate->getStage() != EShLangCallable) {
            if (extensions.find("GL_EXT_ray_cull_mask") != extensions.end()) {
                builder.addCapability(spv::Capability::RayCullMaskKHR);
                builder.addExtension("SPV_KHR_ray_cull_mask");
            }
            if (extensions.find("GL_EXT_ray_tracing_position_fetch") != extensions.end()) {
                builder.addCapability(spv::Capability::RayTracingPositionFetchKHR);
                builder.addExtension("SPV_KHR_ray_tracing_position_fetch");
            }
        }
        break;
    }
    case EShLangTask:
    case EShLangMesh:
        if(isMeshShaderExt) {
            builder.addCapability(spv::Capability::MeshShadingEXT);
            builder.addExtension(spv::E_SPV_EXT_mesh_shader);
        } else {
            builder.addCapability(spv::Capability::MeshShadingNV);
            builder.addExtension(spv::E_SPV_NV_mesh_shader);
        }
        if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6) {
            std::vector<spv::Id> dimConstId;
            for (int dim = 0; dim < 3; ++dim) {
                bool specConst = (glslangIntermediate->getLocalSizeSpecId(dim) != glslang::TQualifier::layoutNotSet);
                dimConstId.push_back(builder.makeUintConstant(glslangIntermediate->getLocalSize(dim), specConst));
                if (specConst) {
                    builder.addDecoration(dimConstId.back(), spv::Decoration::SpecId,
                                          glslangIntermediate->getLocalSizeSpecId(dim));
                }
            }
            builder.addExecutionModeId(shaderEntry, spv::ExecutionMode::LocalSizeId, dimConstId);
        } else {
            builder.addExecutionMode(shaderEntry, spv::ExecutionMode::LocalSize, glslangIntermediate->getLocalSize(0),
                                                                                 glslangIntermediate->getLocalSize(1),
                                                                                 glslangIntermediate->getLocalSize(2));
        }
        if (glslangIntermediate->getStage() == EShLangMesh) {
            builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OutputVertices,
                glslangIntermediate->getVertices());
            builder.addExecutionMode(shaderEntry, spv::ExecutionMode::OutputPrimitivesNV,
                glslangIntermediate->getPrimitives());

            switch (glslangIntermediate->getOutputPrimitive()) {
            case glslang::ElgPoints:        mode = spv::ExecutionMode::OutputPoints;      break;
            case glslang::ElgLines:         mode = spv::ExecutionMode::OutputLinesNV;     break;
            case glslang::ElgTriangles:     mode = spv::ExecutionMode::OutputTrianglesNV; break;
            default:                        mode = spv::ExecutionMode::Max;               break;
            }
            if (mode != spv::ExecutionMode::Max)
                builder.addExecutionMode(shaderEntry, mode);
        }
        break;

    default:
        break;
    }

    //
    // Add SPIR-V requirements (GL_EXT_spirv_intrinsics)
    //
    if (glslangIntermediate->hasSpirvRequirement()) {
        const glslang::TSpirvRequirement& spirvRequirement = glslangIntermediate->getSpirvRequirement();

        // Add SPIR-V extension requirement
        for (auto& extension : spirvRequirement.extensions)
            builder.addExtension(extension.c_str());

        // Add SPIR-V capability requirement
        for (auto capability : spirvRequirement.capabilities)
            builder.addCapability(static_cast<spv::Capability>(capability));
    }

    //
    // Add SPIR-V execution mode qualifiers (GL_EXT_spirv_intrinsics)
    //
    if (glslangIntermediate->hasSpirvExecutionMode()) {
        const glslang::TSpirvExecutionMode& spirvExecutionMode = glslangIntermediate->getSpirvExecutionMode();

        // Add spirv_execution_mode
        for (auto& literalMode : spirvExecutionMode.modes) {
            if (!literalMode.second.empty()) {
                std::vector<unsigned> literals;
                TranslateLiterals(literalMode.second, literals);
                builder.addExecutionMode(shaderEntry, static_cast<spv::ExecutionMode>(literalMode.first), literals);
            } else
                builder.addExecutionMode(shaderEntry, static_cast<spv::ExecutionMode>(literalMode.first));
        }

        // Add spirv_execution_mode_id
        for (auto& modeId : spirvExecutionMode.modeIds) {
            std::vector<spv::Id> operandIds;
            assert(!modeId.second.empty());
            for (auto extraOperand : modeId.second) {
                // Specialization constants are referenced through their symbol;
                // anything else is materialized as a constant.
                if (extraOperand->getType().getQualifier().isSpecConstant())
                    operandIds.push_back(getSymbolId(extraOperand->getAsSymbolNode()));
                else
                    operandIds.push_back(createSpvConstant(*extraOperand));
            }
            builder.addExecutionModeId(shaderEntry, static_cast<spv::ExecutionMode>(modeId.first), operandIds);
        }
    }
}
2088
2089
// Finish creating SPV, after the traversal is complete.
2090
void TGlslangToSpvTraverser::finishSpv(bool compileOnly)
2091
{
2092
// If not linking, an entry point is not expected
2093
if (!compileOnly) {
2094
// Finish the entry point function
2095
if (!entryPointTerminated) {
2096
builder.setBuildPoint(shaderEntry->getLastBlock());
2097
builder.leaveFunction();
2098
}
2099
2100
// finish off the entry-point SPV instruction by adding the Input/Output <id>
2101
entryPoint->reserveOperands(iOSet.size());
2102
for (auto id : iOSet)
2103
entryPoint->addIdOperand(id);
2104
}
2105
2106
// Add capabilities, extensions, remove unneeded decorations, etc.,
2107
// based on the resulting SPIR-V.
2108
// Note: WebGPU code generation must have the opportunity to aggressively
2109
// prune unreachable merge blocks and continue targets.
2110
builder.postProcess(compileOnly);
2111
}
2112
2113
// Write the SPV into 'out'.
2114
void TGlslangToSpvTraverser::dumpSpv(std::vector<unsigned int>& out)
2115
{
2116
builder.dump(out);
2117
}
2118
2119
//
2120
// Implement the traversal functions.
2121
//
2122
// Return true from interior nodes to have the external traversal
2123
// continue on to children. Return false if children were
2124
// already processed.
2125
//
2126
2127
//
2128
// Symbols can turn into
2129
// - uniform/input reads
2130
// - output writes
2131
// - complex lvalue base setups: foo.bar[3].... , where we see foo and start up an access chain
2132
// - something simple that degenerates into the last bullet
2133
//
2134
void TGlslangToSpvTraverser::visitSymbol(glslang::TIntermSymbol* symbol)
2135
{
2136
// We update the line information even though no code might be generated here
2137
// This is helpful to yield correct lines for control flow instructions
2138
if (!linkageOnly) {
2139
builder.setDebugSourceLocation(symbol->getLoc().line, symbol->getLoc().getFilename());
2140
}
2141
2142
if (symbol->getBasicType() == glslang::EbtFunction) {
2143
return;
2144
}
2145
2146
SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
2147
if (symbol->getType().isStruct())
2148
glslangTypeToIdMap[symbol->getType().getStruct()] = symbol->getId();
2149
2150
if (symbol->getType().getQualifier().isSpecConstant())
2151
spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
2152
#ifdef ENABLE_HLSL
2153
// Skip symbol handling if it is string-typed
2154
if (symbol->getBasicType() == glslang::EbtString)
2155
return;
2156
#endif
2157
2158
// getSymbolId() will set up all the IO decorations on the first call.
2159
// Formal function parameters were mapped during makeFunctions().
2160
spv::Id id = getSymbolId(symbol);
2161
2162
if (symbol->getType().getQualifier().isTaskPayload())
2163
taskPayloadID = id; // cache the taskPayloadID to be used it as operand for OpEmitMeshTasksEXT
2164
2165
if (builder.isPointer(id)) {
2166
if (!symbol->getType().getQualifier().isParamInput() &&
2167
!symbol->getType().getQualifier().isParamOutput()) {
2168
// Include all "static use" and "linkage only" interface variables on the OpEntryPoint instruction
2169
// Consider adding to the OpEntryPoint interface list.
2170
// Only looking at structures if they have at least one member.
2171
if (!symbol->getType().isStruct() || symbol->getType().getStruct()->size() > 0) {
2172
spv::StorageClass sc = builder.getStorageClass(id);
2173
// Before SPIR-V 1.4, we only want to include Input and Output.
2174
// Starting with SPIR-V 1.4, we want all globals.
2175
if ((glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4 && builder.isGlobalVariable(id)) ||
2176
(sc == spv::StorageClass::Input || sc == spv::StorageClass::Output)) {
2177
iOSet.insert(id);
2178
}
2179
}
2180
}
2181
2182
// If the SPIR-V type is required to be different than the AST type
2183
// (for ex SubgroupMasks or 3x4 ObjectToWorld/WorldToObject matrices),
2184
// translate now from the SPIR-V type to the AST type, for the consuming
2185
// operation.
2186
// Note this turns it from an l-value to an r-value.
2187
// Currently, all symbols needing this are inputs; avoid the map lookup when non-input.
2188
if (symbol->getType().getQualifier().storage == glslang::EvqVaryingIn)
2189
id = translateForcedType(id);
2190
}
2191
2192
// Only process non-linkage-only nodes for generating actual static uses
2193
if (! linkageOnly || symbol->getQualifier().isSpecConstant()) {
2194
// Prepare to generate code for the access
2195
2196
// L-value chains will be computed left to right. We're on the symbol now,
2197
// which is the left-most part of the access chain, so now is "clear" time,
2198
// followed by setting the base.
2199
builder.clearAccessChain();
2200
2201
// For now, we consider all user variables as being in memory, so they are pointers,
2202
// except for
2203
// A) R-Value arguments to a function, which are an intermediate object.
2204
// See comments in handleUserFunctionCall().
2205
// B) Specialization constants (normal constants don't even come in as a variable),
2206
// These are also pure R-values.
2207
// C) R-Values from type translation, see above call to translateForcedType()
2208
glslang::TQualifier qualifier = symbol->getQualifier();
2209
if (qualifier.isSpecConstant() || rValueParameters.find(symbol->getId()) != rValueParameters.end() ||
2210
!builder.isPointerType(builder.getTypeId(id)))
2211
builder.setAccessChainRValue(id);
2212
else
2213
builder.setAccessChainLValue(id);
2214
}
2215
2216
#ifdef ENABLE_HLSL
2217
// Process linkage-only nodes for any special additional interface work.
2218
if (linkageOnly) {
2219
if (glslangIntermediate->getHlslFunctionality1()) {
2220
// Map implicit counter buffers to their originating buffers, which should have been
2221
// seen by now, given earlier pruning of unused counters, and preservation of order
2222
// of declaration.
2223
if (symbol->getType().getQualifier().isUniformOrBuffer()) {
2224
if (!glslangIntermediate->hasCounterBufferName(symbol->getName())) {
2225
// Save possible originating buffers for counter buffers, keyed by
2226
// making the potential counter-buffer name.
2227
std::string keyName = symbol->getName().c_str();
2228
keyName = glslangIntermediate->addCounterBufferName(keyName);
2229
counterOriginator[keyName] = symbol;
2230
} else {
2231
// Handle a counter buffer, by finding the saved originating buffer.
2232
std::string keyName = symbol->getName().c_str();
2233
auto it = counterOriginator.find(keyName);
2234
if (it != counterOriginator.end()) {
2235
id = getSymbolId(it->second);
2236
if (id != spv::NoResult) {
2237
spv::Id counterId = getSymbolId(symbol);
2238
if (counterId != spv::NoResult) {
2239
builder.addExtension("SPV_GOOGLE_hlsl_functionality1");
2240
builder.addDecorationId(id, spv::Decoration::HlslCounterBufferGOOGLE, counterId);
2241
}
2242
}
2243
}
2244
}
2245
}
2246
}
2247
}
2248
#endif
2249
}
2250
2251
// Visit a binary node.
//
// Assignments, indexing, swizzles and short-circuiting logical operators are
// handled as special cases; everything else is emitted as a generic binary
// operation on the loaded left and right operands.
//
// Returns false when the children were processed here, true when the external
// traversal should continue on to the children.
bool TGlslangToSpvTraverser::visitBinary(glslang::TVisit /* visit */, glslang::TIntermBinary* node)
{
    builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());

    auto* const lhs = node->getLeft();
    auto* const rhs = node->getRight();
    const glslang::TType& lhsType = lhs->getType();
    const glslang::TType& rhsType = rhs->getType();
    const glslang::TOperator op = node->getOp();

    // Record the symbol id behind any struct-typed symbol operand.
    glslang::TIntermSymbol* const lhsSymbol = lhs->getAsSymbolNode();
    if (lhsSymbol != nullptr && lhsType.isStruct()) {
        glslangTypeToIdMap[lhsType.getStruct()] = lhsSymbol->getId();
    }
    glslang::TIntermSymbol* const rhsSymbol = rhs->getAsSymbolNode();
    if (rhsSymbol != nullptr && rhsType.isStruct()) {
        glslangTypeToIdMap[rhsType.getStruct()] = rhsSymbol->getId();
    }

    SpecConstantOpModeGuard specConstantGuard(&builder);
    if (node->getType().getQualifier().isSpecConstant())
        specConstantGuard.turnOnSpecConstantOpMode();

    // First, handle special cases
    switch (op) {
    case glslang::EOpAssign:
    case glslang::EOpAddAssign:
    case glslang::EOpSubAssign:
    case glslang::EOpMulAssign:
    case glslang::EOpVectorTimesMatrixAssign:
    case glslang::EOpVectorTimesScalarAssign:
    case glslang::EOpMatrixTimesScalarAssign:
    case glslang::EOpMatrixTimesMatrixAssign:
    case glslang::EOpDivAssign:
    case glslang::EOpModAssign:
    case glslang::EOpAndAssign:
    case glslang::EOpInclusiveOrAssign:
    case glslang::EOpExclusiveOrAssign:
    case glslang::EOpLeftShiftAssign:
    case glslang::EOpRightShiftAssign:
        // A bin-op assign "a += b" means the same thing as "a = a + b"
        // where a is evaluated before b. For a simple assignment, GLSL
        // says to evaluate the left before the right.  So, always, left
        // node then right node.
        {
            // Build the destination l-value and keep a copy of its access chain.
            builder.clearAccessChain();
            lhs->traverse(this);
            spv::Builder::AccessChain destination = builder.getAccessChain();

            // Evaluate the right-hand side to a value.
            builder.clearAccessChain();
            rhs->traverse(this);
            spv::Id storedValue = accessChainLoad(rhsType);

            // The operand traversals moved the debug location; point it back at the assignment.
            builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());

            if (op != glslang::EOpAssign) {
                // Compound assignment: the destination is read as well.
                builder.setAccessChain(destination);
                spv::Id currentValue = accessChainLoad(lhsType);

                // Combine the two values with the underlying operation.
                spv::Builder::AccessChain::CoherentFlags coherentFlags = TranslateCoherent(lhsType);
                coherentFlags |= TranslateCoherent(rhsType);
                OpDecorations decorations = { TranslatePrecisionDecoration(node->getOperationPrecision()),
                                              TranslateNoContractionDecoration(node->getType().getQualifier()),
                                              TranslateNonUniformDecoration(coherentFlags) };
                storedValue = createBinaryOperation(op, decorations,
                                                    convertGlslangToSpvType(node->getType()), currentValue, storedValue,
                                                    node->getType().getBasicType());

                // these all need their counterparts in createBinaryOperation()
                assert(storedValue != spv::NoResult);
            }

            // Write the result through the saved destination chain.
            builder.setAccessChain(destination);
            multiTypeStore(lhsType, storedValue);

            // An assignment is itself an expression whose value is what was stored.
            builder.clearAccessChain();
            builder.setAccessChainRValue(storedValue);
        }
        return false;
    case glslang::EOpIndexDirect:
    case glslang::EOpIndexDirectStruct:
        {
            // Structure, array, matrix, or vector indirection with statically known index.
            // Start with the left part of the access chain.
            lhs->traverse(this);

            // Then append the next element of the chain.
            const int glslangIndex = rhs->getAsConstantUnion()->getConstArray()[0].getIConst();
            if (!lhsType.isArray() && lhsType.isVector() && op == glslang::EOpIndexDirect) {
                // Swizzle is uniform so propagate uniform into access chain
                spv::Builder::AccessChain::CoherentFlags coherentFlags = TranslateCoherent(lhsType);
                coherentFlags.nonUniform = 0;

                // Selecting one vector component is a swizzle of size 1, so
                // push a swizzle instead of going through a regular chain index.
                std::vector<unsigned> swizzle(1, static_cast<unsigned>(glslangIndex));
                int dummySize;
                builder.accessChainPushSwizzle(swizzle, convertGlslangToSpvType(lhsType),
                                               coherentFlags,
                                               glslangIntermediate->getBaseAlignmentScalar(lhsType, dummySize));
            } else {
                // Load through a block reference is performed with a dot operator that
                // is mapped to EOpIndexDirectStruct. When we get to the actual reference,
                // do a load and reset the access chain.
                if (lhs->isReference() && !lhsType.isArray() && op == glslang::EOpIndexDirectStruct) {
                    spv::Id referenceValue = accessChainLoad(lhsType);
                    builder.clearAccessChain();
                    builder.setAccessChainLValue(referenceValue);
                }

                int spvIndex = glslangIndex;
                if (lhs->getBasicType() == glslang::EbtBlock && op == glslang::EOpIndexDirectStruct) {
                    // This may be, e.g., an anonymous block-member selection, which generally need
                    // index remapping due to hidden members in anonymous blocks.
                    long long glslangId = glslangTypeToIdMap[lhsType.getStruct()];
                    auto remapEntry = memberRemapper.find(glslangId);
                    if (remapEntry != memberRemapper.end()) {
                        std::vector<int>& remapper = remapEntry->second;
                        assert(remapper.size() > 0);
                        spvIndex = remapper[glslangIndex];
                    }
                }

                // Struct reference propagates uniform lvalue
                spv::Builder::AccessChain::CoherentFlags coherentFlags = TranslateCoherent(lhsType);
                coherentFlags.nonUniform = 0;

                // normal case for indexing array or structure or block
                if ((rhsType.getBasicType() == glslang::EbtUint && glslangIntermediate->usingPromoteUint32Indices()) ||
                    rhsType.contains64BitInt()) {
                    // The index is pushed as a 64-bit constant in this case.
                    int64_t wideIndex = rhsType.contains64BitInt() ?
                                            rhs->getAsConstantUnion()->getConstArray()[0].getI64Const() :
                                            rhs->getAsConstantUnion()->getConstArray()[0].getUConst();
                    builder.accessChainPush(builder.makeInt64Constant(wideIndex),
                                            coherentFlags,
                                            lhsType.getBufferReferenceAlignment());
                } else {
                    builder.accessChainPush(builder.makeIntConstant(spvIndex),
                                            coherentFlags,
                                            lhsType.getBufferReferenceAlignment());
                }

                // Add capabilities here for accessing PointSize and clip/cull distance.
                // We have deferred generation of associated capabilities until now.
                if (lhsType.isStruct() && !lhsType.isArray())
                    declareUseOfStructMember(*(lhsType.getStruct()), glslangIndex);
            }
        }
        return false;
    case glslang::EOpIndexIndirect:
        {
            // Array, matrix, or vector indirection with variable index.
            // Will use native SPIR-V access-chain for and array indirection;
            // matrices are arrays of vectors, so will also work for a matrix.
            // Will use the access chain's 'component' for variable index into a vector.

            // Access chains are built left to right, so set up the left part first...
            lhs->traverse(this);

            // ...and keep a copy, because evaluating the index reuses the builder's chain.
            spv::Builder::AccessChain baseChain = builder.getAccessChain();

            // Evaluate the index expression.
            builder.clearAccessChain();
            rhs->traverse(this);
            spv::Id index = accessChainLoad(rhsType);

            // Zero-extend smaller unsigned integer types for array indexing.
            // SPIR-V OpAccessChain treats indices as signed, so we need to zero-extend
            // unsigned types to preserve their values (signed types are fine as-is).
            spv::Id indexType = builder.getTypeId(index);
            if (builder.isUintType(indexType) && builder.getScalarTypeWidth(indexType) < 32) {
                spv::Id uint32Type = builder.makeUintType(32);
                index = builder.createUnaryOp(spv::Op::OpUConvert, uint32Type, index);
            }

            addIndirectionIndexCapabilities(lhsType, rhsType);

            // Back to the chain for the left side.
            builder.setAccessChain(baseChain);

            // Only if index is nonUniform should we propagate nonUniform into access chain
            spv::Builder::AccessChain::CoherentFlags indexFlags = TranslateCoherent(rhsType);
            spv::Builder::AccessChain::CoherentFlags chainFlags = TranslateCoherent(lhsType);
            chainFlags.nonUniform = indexFlags.nonUniform;

            if (!lhsType.isArray() && lhsType.isVector()) {
                // Dynamic component selection on a vector.
                int dummySize;
                builder.accessChainPushComponent(
                    index, convertGlslangToSpvType(lhsType), chainFlags,
                    glslangIntermediate->getBaseAlignmentScalar(lhsType, dummySize));
            } else {
                if (glslangIntermediate->usingPromoteUint32Indices() &&
                    rhsType.getBasicType() == glslang::EbtUint) {
                    index = createIntWidthConversion(index, 0, builder.makeIntegerType(64, true), glslang::EbtInt64,
                                                     rhsType.getBasicType());
                }

                builder.accessChainPush(index, chainFlags, lhsType.getBufferReferenceAlignment());
            }
        }
        return false;
    case glslang::EOpVectorSwizzle:
        {
            lhs->traverse(this);
            std::vector<unsigned> swizzle;
            convertSwizzle(*rhs->getAsAggregate(), swizzle);
            int dummySize;
            builder.accessChainPushSwizzle(swizzle, convertGlslangToSpvType(lhsType),
                                           TranslateCoherent(lhsType),
                                           glslangIntermediate->getBaseAlignmentScalar(lhsType, dummySize));
        }
        return false;
    case glslang::EOpMatrixSwizzle:
        logger->missingFunctionality("matrix swizzle");
        return true;
    case glslang::EOpLogicalOr:
    case glslang::EOpLogicalAnd:
        {
            // These may require short circuiting, but can sometimes be done as straight
            // binary operations.  The right operand must be short circuited if it has
            // side effects, and should probably be if it is complex.
            if (isTrivial(rhs->getAsTyped()))
                break; // handle below as a normal binary operation

            // otherwise, we need to do dynamic short circuiting on the right operand
            spv::Id shortCircuited = createShortCircuit(op, *lhs->getAsTyped(), *rhs->getAsTyped());
            builder.clearAccessChain();
            builder.setAccessChainRValue(shortCircuited);
        }
        return false;
    default:
        break;
    }

    // Assume generic binary op...

    // get left operand
    builder.clearAccessChain();
    lhs->traverse(this);
    spv::Id leftValue = accessChainLoad(lhsType);

    // get right operand
    builder.clearAccessChain();
    rhs->traverse(this);
    spv::Id rightValue = accessChainLoad(rhsType);

    // get result
    OpDecorations decorations = { TranslatePrecisionDecoration(node->getOperationPrecision()),
                                  TranslateNoContractionDecoration(node->getType().getQualifier()),
                                  TranslateNonUniformDecoration(node->getType().getQualifier()) };
    spv::Id result = createBinaryOperation(op, decorations,
                                           convertGlslangToSpvType(node->getType()), leftValue, rightValue,
                                           lhsType.getBasicType());

    builder.clearAccessChain();
    if (!result) {
        logger->missingFunctionality("unknown glslang binary operation");
        return true;  // pick up a child as the place-holder result
    }

    builder.setAccessChainRValue(result);
    return false;
}
2528
2529
// Convert a value loaded with type 'nominalTypeId' to the bool-based type
// that 'type' calls for, when the two differ:
//  - scalar: compared against the uint constant 0, giving a bool
//  - vector: compared component-wise against a smeared uint 0, giving a bvec
//  - array:  OpCopyLogical on SPIR-V 1.4+, otherwise converted element by
//            element (recursively) and reassembled
// Any other kind of type, or a type that already matches, returns 'loadedId'
// unchanged.
spv::Id TGlslangToSpvTraverser::convertLoadedBoolInUniformToUint(const glslang::TType& type,
                                                                 spv::Id nominalTypeId,
                                                                 spv::Id loadedId)
{
    // Conversion for bool
    if (builder.isScalarType(nominalTypeId)) {
        const spv::Id boolTypeId = builder.makeBoolType();
        if (nominalTypeId == boolTypeId)
            return loadedId;
        return builder.createBinOp(spv::Op::OpINotEqual, boolTypeId, loadedId, builder.makeUintConstant(0));
    }

    // Conversion for bvec
    if (builder.isVectorType(nominalTypeId)) {
        const int componentCount = builder.getNumTypeComponents(nominalTypeId);
        const spv::Id bvecTypeId = builder.makeVectorType(builder.makeBoolType(), componentCount);
        if (nominalTypeId == bvecTypeId)
            return loadedId;
        return builder.createBinOp(spv::Op::OpINotEqual, bvecTypeId, loadedId,
                                   makeSmearedConstant(builder.makeUintConstant(0), componentCount));
    }

    if (!builder.isArrayType(nominalTypeId))
        return loadedId;

    // Conversion for bool array
    const spv::Id boolArrayTypeId = convertGlslangToSpvType(type);
    if (nominalTypeId == boolArrayTypeId)
        return loadedId;

    // Use OpCopyLogical from SPIR-V 1.4 if available.
    if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4)
        return builder.createUnaryOp(spv::Op::OpCopyLogical, boolArrayTypeId, loadedId);

    // Otherwise extract each element, convert it recursively, and rebuild the array.
    glslang::TType elementType(type, 0);
    const spv::Id elementNominalTypeId = builder.getContainedTypeId(nominalTypeId);
    std::vector<spv::Id> convertedElements;
    for (int element = 0; element < type.getOuterArraySize(); ++element) {
        const spv::Id extracted = builder.createCompositeExtract(loadedId, elementNominalTypeId, element);
        convertedElements.push_back(
            convertLoadedBoolInUniformToUint(elementType, elementNominalTypeId, extracted));
    }
    return builder.createCompositeConstruct(boolArrayTypeId, convertedElements);
}
2571
2572
// Figure out what, if any, type changes are needed when accessing a specific built-in.
2573
// Returns <the type SPIR-V requires for declarion, the type to translate to on use>.
2574
// Also see comment for 'forceType', regarding tracking SPIR-V-required types.
2575
std::pair<spv::Id, spv::Id> TGlslangToSpvTraverser::getForcedType(glslang::TBuiltInVariable glslangBuiltIn,
2576
const glslang::TType& glslangType)
2577
{
2578
switch(glslangBuiltIn)
2579
{
2580
case glslang::EbvSubGroupEqMask:
2581
case glslang::EbvSubGroupGeMask:
2582
case glslang::EbvSubGroupGtMask:
2583
case glslang::EbvSubGroupLeMask:
2584
case glslang::EbvSubGroupLtMask: {
2585
// these require changing a 64-bit scaler -> a vector of 32-bit components
2586
if (glslangType.isVector())
2587
break;
2588
spv::Id ivec4_type = builder.makeVectorType(builder.makeUintType(32), 4);
2589
spv::Id uint64_type = builder.makeUintType(64);
2590
std::pair<spv::Id, spv::Id> ret(ivec4_type, uint64_type);
2591
return ret;
2592
}
2593
// There are no SPIR-V builtins defined for these and map onto original non-transposed
2594
// builtins. During visitBinary we insert a transpose
2595
case glslang::EbvWorldToObject3x4:
2596
case glslang::EbvObjectToWorld3x4: {
2597
spv::Id mat43 = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);
2598
spv::Id mat34 = builder.makeMatrixType(builder.makeFloatType(32), 3, 4);
2599
std::pair<spv::Id, spv::Id> ret(mat43, mat34);
2600
return ret;
2601
}
2602
default:
2603
break;
2604
}
2605
2606
std::pair<spv::Id, spv::Id> ret(spv::NoType, spv::NoType);
2607
return ret;
2608
}
2609
2610
// For an object previously identified (see getForcedType() and forceType)
2611
// as needing type translations, do the translation needed for a load, turning
2612
// an L-value into in R-value.
2613
spv::Id TGlslangToSpvTraverser::translateForcedType(spv::Id object)
2614
{
2615
const auto forceIt = forceType.find(object);
2616
if (forceIt == forceType.end())
2617
return object;
2618
2619
spv::Id desiredTypeId = forceIt->second;
2620
spv::Id objectTypeId = builder.getTypeId(object);
2621
assert(builder.isPointerType(objectTypeId));
2622
objectTypeId = builder.getContainedTypeId(objectTypeId);
2623
if (builder.isVectorType(objectTypeId) &&
2624
builder.getScalarTypeWidth(builder.getContainedTypeId(objectTypeId)) == 32) {
2625
if (builder.getScalarTypeWidth(desiredTypeId) == 64) {
2626
// handle 32-bit v.xy* -> 64-bit
2627
builder.clearAccessChain();
2628
builder.setAccessChainLValue(object);
2629
object = builder.accessChainLoad(spv::NoPrecision, spv::Decoration::Max, spv::Decoration::Max, objectTypeId);
2630
std::vector<spv::Id> components;
2631
components.push_back(builder.createCompositeExtract(object, builder.getContainedTypeId(objectTypeId), 0));
2632
components.push_back(builder.createCompositeExtract(object, builder.getContainedTypeId(objectTypeId), 1));
2633
2634
spv::Id vecType = builder.makeVectorType(builder.getContainedTypeId(objectTypeId), 2);
2635
return builder.createUnaryOp(spv::Op::OpBitcast, desiredTypeId,
2636
builder.createCompositeConstruct(vecType, components));
2637
} else {
2638
logger->missingFunctionality("forcing 32-bit vector type to non 64-bit scalar");
2639
}
2640
} else if (builder.isMatrixType(objectTypeId)) {
2641
// There are no SPIR-V builtins defined for 3x4 variants of ObjectToWorld/WorldToObject
2642
// and we insert a transpose after loading the original non-transposed builtins
2643
builder.clearAccessChain();
2644
builder.setAccessChainLValue(object);
2645
object = builder.accessChainLoad(spv::NoPrecision, spv::Decoration::Max, spv::Decoration::Max, objectTypeId);
2646
return builder.createUnaryOp(spv::Op::OpTranspose, desiredTypeId, object);
2647
2648
} else {
2649
logger->missingFunctionality("forcing non 32-bit vector type");
2650
}
2651
2652
return object;
2653
}
2654
2655
bool TGlslangToSpvTraverser::visitUnary(glslang::TVisit /* visit */, glslang::TIntermUnary* node)
2656
{
2657
builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
2658
2659
SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
2660
if (node->getType().getQualifier().isSpecConstant())
2661
spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
2662
2663
spv::Id result = spv::NoResult;
2664
2665
// try texturing first
2666
result = createImageTextureFunctionCall(node);
2667
if (result != spv::NoResult) {
2668
builder.clearAccessChain();
2669
builder.setAccessChainRValue(result);
2670
2671
return false; // done with this node
2672
}
2673
2674
// Non-texturing.
2675
2676
if (node->getOp() == glslang::EOpArrayLength) {
2677
// Quite special; won't want to evaluate the operand.
2678
2679
// Currently, the front-end does not allow .length() on an array until it is sized,
2680
// except for the last block member of an SSBO.
2681
// TODO: If this changes, link-time sized arrays might show up here, and need their
2682
// size extracted.
2683
2684
// Normal .length() would have been constant folded by the front-end.
2685
// So, this has to be block.lastMember.length().
2686
// SPV wants "block" and member number as the operands, go get them.
2687
2688
uint32_t bits = node->getType().contains64BitInt() ? 64 : 32;
2689
2690
spv::Id length;
2691
if (node->getOperand()->getType().isCoopMat()) {
2692
spv::Id typeId = convertGlslangToSpvType(node->getOperand()->getType());
2693
assert(builder.isCooperativeMatrixType(typeId));
2694
2695
if (node->getOperand()->getType().isCoopMatKHR()) {
2696
length = builder.createCooperativeMatrixLengthKHR(typeId);
2697
} else {
2698
spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
2699
length = builder.createCooperativeMatrixLengthNV(typeId);
2700
}
2701
} else if (node->getOperand()->getType().isCoopVecNV()) {
2702
spv::Id typeId = convertGlslangToSpvType(node->getOperand()->getType());
2703
length = builder.getCooperativeVectorNumComponents(typeId);
2704
} else {
2705
glslang::TIntermTyped* block = node->getOperand()->getAsBinaryNode()->getLeft();
2706
block->traverse(this);
2707
unsigned int member = node->getOperand()->getAsBinaryNode()->getRight()->getAsConstantUnion()
2708
->getConstArray()[0].getUConst();
2709
length = builder.createArrayLength(builder.accessChainGetLValue(), member, bits);
2710
}
2711
2712
// GLSL semantics say the result of .length() is an int, while SPIR-V says
2713
// signedness must be 0. So, convert from SPIR-V unsigned back to GLSL's
2714
// AST expectation of a signed result.
2715
if (glslangIntermediate->getSource() == glslang::EShSourceGlsl) {
2716
if (builder.isInSpecConstCodeGenMode()) {
2717
length = builder.createBinOp(spv::Op::OpIAdd, builder.makeIntType(bits), length, builder.makeIntConstant(0));
2718
} else {
2719
length = builder.createUnaryOp(spv::Op::OpBitcast, builder.makeIntType(bits), length);
2720
}
2721
}
2722
2723
builder.clearAccessChain();
2724
builder.setAccessChainRValue(length);
2725
2726
return false;
2727
}
2728
2729
// Force variable declaration - Debug Mode Only
2730
if (node->getOp() == glslang::EOpDeclare) {
2731
builder.clearAccessChain();
2732
node->getOperand()->traverse(this);
2733
builder.clearAccessChain();
2734
return false;
2735
}
2736
2737
// Start by evaluating the operand
2738
2739
// Does it need a swizzle inversion? If so, evaluation is inverted;
2740
// operate first on the swizzle base, then apply the swizzle.
2741
spv::Id invertedType = spv::NoType;
2742
auto resultType = [&invertedType, &node, this](){ return invertedType != spv::NoType ?
2743
invertedType : convertGlslangToSpvType(node->getType()); };
2744
if (node->getOp() == glslang::EOpInterpolateAtCentroid)
2745
invertedType = getInvertedSwizzleType(*node->getOperand());
2746
2747
builder.clearAccessChain();
2748
TIntermNode *operandNode;
2749
if (invertedType != spv::NoType)
2750
operandNode = node->getOperand()->getAsBinaryNode()->getLeft();
2751
else
2752
operandNode = node->getOperand();
2753
2754
operandNode->traverse(this);
2755
2756
spv::Id operand = spv::NoResult;
2757
2758
spv::Builder::AccessChain::CoherentFlags lvalueCoherentFlags;
2759
2760
const auto hitObjectOpsWithLvalue = [](glslang::TOperator op) {
2761
switch(op) {
2762
case glslang::EOpReorderThreadNV:
2763
case glslang::EOpHitObjectGetCurrentTimeNV:
2764
case glslang::EOpHitObjectGetHitKindNV:
2765
case glslang::EOpHitObjectGetPrimitiveIndexNV:
2766
case glslang::EOpHitObjectGetGeometryIndexNV:
2767
case glslang::EOpHitObjectGetInstanceIdNV:
2768
case glslang::EOpHitObjectGetInstanceCustomIndexNV:
2769
case glslang::EOpHitObjectGetObjectRayDirectionNV:
2770
case glslang::EOpHitObjectGetObjectRayOriginNV:
2771
case glslang::EOpHitObjectGetWorldRayDirectionNV:
2772
case glslang::EOpHitObjectGetWorldRayOriginNV:
2773
case glslang::EOpHitObjectGetWorldToObjectNV:
2774
case glslang::EOpHitObjectGetObjectToWorldNV:
2775
case glslang::EOpHitObjectGetRayTMaxNV:
2776
case glslang::EOpHitObjectGetRayTMinNV:
2777
case glslang::EOpHitObjectIsEmptyNV:
2778
case glslang::EOpHitObjectIsHitNV:
2779
case glslang::EOpHitObjectIsMissNV:
2780
case glslang::EOpHitObjectRecordEmptyNV:
2781
case glslang::EOpHitObjectGetShaderBindingTableRecordIndexNV:
2782
case glslang::EOpHitObjectGetShaderRecordBufferHandleNV:
2783
case glslang::EOpHitObjectGetClusterIdNV:
2784
case glslang::EOpHitObjectGetSpherePositionNV:
2785
case glslang::EOpHitObjectGetSphereRadiusNV:
2786
case glslang::EOpHitObjectIsSphereHitNV:
2787
case glslang::EOpHitObjectIsLSSHitNV:
2788
case glslang::EOpReorderThreadEXT:
2789
case glslang::EOpHitObjectGetCurrentTimeEXT:
2790
case glslang::EOpHitObjectGetHitKindEXT:
2791
case glslang::EOpHitObjectGetPrimitiveIndexEXT:
2792
case glslang::EOpHitObjectGetGeometryIndexEXT:
2793
case glslang::EOpHitObjectGetInstanceIdEXT:
2794
case glslang::EOpHitObjectGetInstanceCustomIndexEXT:
2795
case glslang::EOpHitObjectGetObjectRayDirectionEXT:
2796
case glslang::EOpHitObjectGetObjectRayOriginEXT:
2797
case glslang::EOpHitObjectGetWorldRayDirectionEXT:
2798
case glslang::EOpHitObjectGetWorldRayOriginEXT:
2799
case glslang::EOpHitObjectGetWorldToObjectEXT:
2800
case glslang::EOpHitObjectGetObjectToWorldEXT:
2801
case glslang::EOpHitObjectGetRayTMaxEXT:
2802
case glslang::EOpHitObjectGetRayTMinEXT:
2803
case glslang::EOpHitObjectGetRayFlagsEXT:
2804
case glslang::EOpHitObjectIsEmptyEXT:
2805
case glslang::EOpHitObjectIsHitEXT:
2806
case glslang::EOpHitObjectIsMissEXT:
2807
case glslang::EOpHitObjectRecordEmptyEXT:
2808
case glslang::EOpHitObjectGetShaderBindingTableRecordIndexEXT:
2809
case glslang::EOpHitObjectGetShaderRecordBufferHandleEXT:
2810
return true;
2811
default:
2812
return false;
2813
}
2814
};
2815
2816
if (node->getOp() == glslang::EOpAtomicCounterIncrement ||
2817
node->getOp() == glslang::EOpAtomicCounterDecrement ||
2818
node->getOp() == glslang::EOpAtomicCounter ||
2819
(node->getOp() == glslang::EOpInterpolateAtCentroid &&
2820
glslangIntermediate->getSource() != glslang::EShSourceHlsl) ||
2821
node->getOp() == glslang::EOpRayQueryProceed ||
2822
node->getOp() == glslang::EOpRayQueryGetRayTMin ||
2823
node->getOp() == glslang::EOpRayQueryGetRayFlags ||
2824
node->getOp() == glslang::EOpRayQueryGetWorldRayOrigin ||
2825
node->getOp() == glslang::EOpRayQueryGetWorldRayDirection ||
2826
node->getOp() == glslang::EOpRayQueryGetIntersectionCandidateAABBOpaque ||
2827
node->getOp() == glslang::EOpRayQueryTerminate ||
2828
node->getOp() == glslang::EOpRayQueryConfirmIntersection ||
2829
(node->getOp() == glslang::EOpSpirvInst && operandNode->getAsTyped()->getQualifier().isSpirvByReference()) ||
2830
hitObjectOpsWithLvalue(node->getOp())) {
2831
operand = builder.accessChainGetLValue(); // Special case l-value operands
2832
lvalueCoherentFlags = builder.getAccessChain().coherentFlags;
2833
lvalueCoherentFlags |= TranslateCoherent(operandNode->getAsTyped()->getType());
2834
} else if (operandNode->getAsTyped()->getQualifier().isSpirvLiteral()) {
2835
// Will be translated to a literal value, make a placeholder here
2836
operand = spv::NoResult;
2837
} else {
2838
operand = accessChainLoad(node->getOperand()->getType());
2839
}
2840
2841
OpDecorations decorations = { TranslatePrecisionDecoration(node->getOperationPrecision()),
2842
TranslateNoContractionDecoration(node->getType().getQualifier()),
2843
TranslateNonUniformDecoration(node->getType().getQualifier()) };
2844
2845
// it could be a conversion
2846
if (! result) {
2847
result = createConversion(node->getOp(), decorations, resultType(), operand,
2848
node->getType().getBasicType(), node->getOperand()->getBasicType());
2849
if (result) {
2850
if (node->getType().isCoopMatKHR() && node->getOperand()->getAsTyped()->getType().isCoopMatKHR() &&
2851
!node->getAsTyped()->getType().sameCoopMatUse(node->getOperand()->getAsTyped()->getType())) {
2852
// Conversions that change use need CapabilityCooperativeMatrixConversionsNV
2853
builder.addCapability(spv::Capability::CooperativeMatrixConversionsNV);
2854
builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
2855
}
2856
}
2857
}
2858
2859
// if not, then possibly an operation
2860
if (! result)
2861
result = createUnaryOperation(node->getOp(), decorations, resultType(), operand,
2862
node->getOperand()->getBasicType(), lvalueCoherentFlags, node->getType());
2863
2864
// it could be attached to a SPIR-V instruction
2865
if (!result) {
2866
if (node->getOp() == glslang::EOpSpirvInst) {
2867
const auto& spirvInst = node->getSpirvInstruction();
2868
if (spirvInst.set == "") {
2869
spv::IdImmediate idImmOp = {true, operand};
2870
if (operandNode->getAsTyped()->getQualifier().isSpirvLiteral()) {
2871
// Translate the constant to a literal value
2872
std::vector<unsigned> literals;
2873
glslang::TVector<const glslang::TIntermConstantUnion*> constants;
2874
constants.push_back(operandNode->getAsConstantUnion());
2875
TranslateLiterals(constants, literals);
2876
idImmOp = {false, literals[0]};
2877
}
2878
2879
if (node->getBasicType() == glslang::EbtVoid)
2880
builder.createNoResultOp(static_cast<spv::Op>(spirvInst.id), {idImmOp});
2881
else
2882
result = builder.createOp(static_cast<spv::Op>(spirvInst.id), resultType(), {idImmOp});
2883
} else {
2884
result = builder.createBuiltinCall(
2885
resultType(), spirvInst.set == "GLSL.std.450" ? stdBuiltins : getExtBuiltins(spirvInst.set.c_str()),
2886
spirvInst.id, {operand});
2887
}
2888
2889
if (node->getBasicType() == glslang::EbtVoid)
2890
return false; // done with this node
2891
}
2892
}
2893
2894
if (result) {
2895
if (invertedType) {
2896
result = createInvertedSwizzle(decorations.precision, *node->getOperand(), result);
2897
decorations.addNonUniform(builder, result);
2898
}
2899
2900
builder.clearAccessChain();
2901
builder.setAccessChainRValue(result);
2902
2903
return false; // done with this node
2904
}
2905
2906
// it must be a special case, check...
2907
switch (node->getOp()) {
2908
case glslang::EOpPostIncrement:
2909
case glslang::EOpPostDecrement:
2910
case glslang::EOpPreIncrement:
2911
case glslang::EOpPreDecrement:
2912
{
2913
// we need the integer value "1" or the floating point "1.0" to add/subtract
2914
spv::Id one = 0;
2915
if (node->getBasicType() == glslang::EbtFloat)
2916
one = builder.makeFloatConstant(1.0F);
2917
else if (node->getBasicType() == glslang::EbtDouble)
2918
one = builder.makeDoubleConstant(1.0);
2919
else if (node->getBasicType() == glslang::EbtFloat16)
2920
one = builder.makeFloat16Constant(1.0F);
2921
else if (node->getBasicType() == glslang::EbtBFloat16)
2922
one = builder.makeBFloat16Constant(1.0F);
2923
else if (node->getBasicType() == glslang::EbtFloatE5M2)
2924
one = builder.makeFloatE5M2Constant(1.0F);
2925
else if (node->getBasicType() == glslang::EbtFloatE4M3)
2926
one = builder.makeFloatE4M3Constant(1.0F);
2927
else if (node->getBasicType() == glslang::EbtInt8 || node->getBasicType() == glslang::EbtUint8)
2928
one = builder.makeInt8Constant(1);
2929
else if (node->getBasicType() == glslang::EbtInt16 || node->getBasicType() == glslang::EbtUint16)
2930
one = builder.makeInt16Constant(1);
2931
else if (node->getBasicType() == glslang::EbtInt64 || node->getBasicType() == glslang::EbtUint64)
2932
one = builder.makeInt64Constant(1);
2933
else
2934
one = builder.makeIntConstant(1);
2935
glslang::TOperator op;
2936
if (node->getOp() == glslang::EOpPreIncrement ||
2937
node->getOp() == glslang::EOpPostIncrement)
2938
op = glslang::EOpAdd;
2939
else
2940
op = glslang::EOpSub;
2941
2942
spv::Id result = createBinaryOperation(op, decorations,
2943
convertGlslangToSpvType(node->getType()), operand, one,
2944
node->getType().getBasicType());
2945
assert(result != spv::NoResult);
2946
2947
// The result of operation is always stored, but conditionally the
2948
// consumed result. The consumed result is always an r-value.
2949
builder.accessChainStore(result,
2950
TranslateNonUniformDecoration(builder.getAccessChain().coherentFlags));
2951
builder.clearAccessChain();
2952
if (node->getOp() == glslang::EOpPreIncrement ||
2953
node->getOp() == glslang::EOpPreDecrement)
2954
builder.setAccessChainRValue(result);
2955
else
2956
builder.setAccessChainRValue(operand);
2957
}
2958
2959
return false;
2960
2961
case glslang::EOpAssumeEXT:
2962
builder.addCapability(spv::Capability::ExpectAssumeKHR);
2963
builder.addExtension(spv::E_SPV_KHR_expect_assume);
2964
builder.createNoResultOp(spv::Op::OpAssumeTrueKHR, operand);
2965
return false;
2966
case glslang::EOpEmitStreamVertex:
2967
builder.createNoResultOp(spv::Op::OpEmitStreamVertex, operand);
2968
return false;
2969
case glslang::EOpEndStreamPrimitive:
2970
builder.createNoResultOp(spv::Op::OpEndStreamPrimitive, operand);
2971
return false;
2972
case glslang::EOpRayQueryTerminate:
2973
builder.createNoResultOp(spv::Op::OpRayQueryTerminateKHR, operand);
2974
return false;
2975
case glslang::EOpRayQueryConfirmIntersection:
2976
builder.createNoResultOp(spv::Op::OpRayQueryConfirmIntersectionKHR, operand);
2977
return false;
2978
case glslang::EOpReorderThreadNV:
2979
builder.createNoResultOp(spv::Op::OpReorderThreadWithHitObjectNV, operand);
2980
return false;
2981
case glslang::EOpReorderThreadEXT:
2982
builder.createNoResultOp(spv::Op::OpReorderThreadWithHitObjectEXT, operand);
2983
return false;
2984
case glslang::EOpHitObjectRecordEmptyNV:
2985
builder.createNoResultOp(spv::Op::OpHitObjectRecordEmptyNV, operand);
2986
return false;
2987
case glslang::EOpHitObjectRecordEmptyEXT:
2988
builder.createNoResultOp(spv::Op::OpHitObjectRecordEmptyEXT, operand);
2989
return false;
2990
2991
case glslang::EOpCreateTensorLayoutNV:
2992
result = builder.createOp(spv::Op::OpCreateTensorLayoutNV, resultType(), std::vector<spv::Id>{});
2993
builder.clearAccessChain();
2994
builder.setAccessChainRValue(result);
2995
return false;
2996
2997
case glslang::EOpCreateTensorViewNV:
2998
result = builder.createOp(spv::Op::OpCreateTensorViewNV, resultType(), std::vector<spv::Id>{});
2999
builder.clearAccessChain();
3000
builder.setAccessChainRValue(result);
3001
return false;
3002
3003
default:
3004
logger->missingFunctionality("unknown glslang unary");
3005
return true; // pick up operand as placeholder result
3006
}
3007
}
3008
3009
// Construct a composite object, recursively copying members if their types don't match
3010
spv::Id TGlslangToSpvTraverser::createCompositeConstruct(spv::Id resultTypeId, std::vector<spv::Id> constituents)
3011
{
3012
for (int c = 0; c < (int)constituents.size(); ++c) {
3013
spv::Id& constituent = constituents[c];
3014
spv::Id lType = builder.getContainedTypeId(resultTypeId, c);
3015
spv::Id rType = builder.getTypeId(constituent);
3016
if (lType != rType) {
3017
if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4) {
3018
constituent = builder.createUnaryOp(spv::Op::OpCopyLogical, lType, constituent);
3019
} else if (builder.isStructType(rType)) {
3020
std::vector<spv::Id> rTypeConstituents;
3021
int numrTypeConstituents = builder.getNumTypeConstituents(rType);
3022
for (int i = 0; i < numrTypeConstituents; ++i) {
3023
rTypeConstituents.push_back(builder.createCompositeExtract(constituent,
3024
builder.getContainedTypeId(rType, i), i));
3025
}
3026
constituents[c] = createCompositeConstruct(lType, rTypeConstituents);
3027
} else {
3028
assert(builder.isArrayType(rType));
3029
std::vector<spv::Id> rTypeConstituents;
3030
int numrTypeConstituents = builder.getNumTypeConstituents(rType);
3031
3032
spv::Id elementRType = builder.getContainedTypeId(rType);
3033
for (int i = 0; i < numrTypeConstituents; ++i) {
3034
rTypeConstituents.push_back(builder.createCompositeExtract(constituent, elementRType, i));
3035
}
3036
constituents[c] = createCompositeConstruct(lType, rTypeConstituents);
3037
}
3038
}
3039
}
3040
return builder.createCompositeConstruct(resultTypeId, constituents);
3041
}
3042
3043
bool TGlslangToSpvTraverser::visitAggregate(glslang::TVisit visit, glslang::TIntermAggregate* node)
3044
{
3045
SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
3046
if (node->getType().getQualifier().isSpecConstant())
3047
spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
3048
3049
spv::Id result = spv::NoResult;
3050
spv::Id invertedType = spv::NoType; // to use to override the natural type of the node
3051
std::vector<spv::Builder::AccessChain> complexLvalues; // for holding swizzling l-values too complex for
3052
// SPIR-V, for an out parameter
3053
std::vector<spv::Id> temporaryLvalues; // temporaries to pass, as proxies for complexLValues
3054
3055
auto resultType = [&invertedType, &node, this](){
3056
if (invertedType != spv::NoType) {
3057
return invertedType;
3058
} else {
3059
auto ret = convertGlslangToSpvType(node->getType());
3060
// convertGlslangToSpvType may clobber the debug location, reset it
3061
builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
3062
return ret;
3063
}
3064
};
3065
3066
// try texturing
3067
result = createImageTextureFunctionCall(node);
3068
if (result != spv::NoResult) {
3069
builder.clearAccessChain();
3070
builder.setAccessChainRValue(result);
3071
3072
return false;
3073
} else if (node->getOp() == glslang::EOpImageStore ||
3074
node->getOp() == glslang::EOpImageStoreLod ||
3075
node->getOp() == glslang::EOpImageAtomicStore) {
3076
// "imageStore" is a special case, which has no result
3077
return false;
3078
}
3079
3080
glslang::TOperator binOp = glslang::EOpNull;
3081
bool reduceComparison = true;
3082
bool isMatrix = false;
3083
bool noReturnValue = false;
3084
bool atomic = false;
3085
3086
spv::Builder::AccessChain::CoherentFlags lvalueCoherentFlags;
3087
3088
assert(node->getOp());
3089
3090
spv::Decoration precision = TranslatePrecisionDecoration(node->getOperationPrecision());
3091
3092
switch (node->getOp()) {
3093
case glslang::EOpScope:
3094
case glslang::EOpSequence:
3095
{
3096
if (visit == glslang::EvPreVisit) {
3097
++sequenceDepth;
3098
if (sequenceDepth == 1) {
3099
// If this is the parent node of all the functions, we want to see them
3100
// early, so all call points have actual SPIR-V functions to reference.
3101
// In all cases, still let the traverser visit the children for us.
3102
makeFunctions(node->getAsAggregate()->getSequence());
3103
3104
// Global initializers are specific to the shader entry point, which does not exist in compile-only mode
3105
if (!options.compileOnly) {
3106
// Also, we want all global initializers to go into the beginning of the entry point, before
3107
// anything else gets there, so visit out of order, doing them all now.
3108
makeGlobalInitializers(node->getAsAggregate()->getSequence());
3109
}
3110
3111
// Preprocess linker objects for ray tracing stages
3112
if (glslangIntermediate->isRayTracingStage())
3113
collectRayTracingLinkerObjects();
3114
3115
// Initializers are done, don't want to visit again, but functions and link objects need to be processed,
3116
// so do them manually.
3117
visitFunctions(node->getAsAggregate()->getSequence());
3118
3119
return false;
3120
} else {
3121
if (node->getOp() == glslang::EOpScope) {
3122
auto loc = node->getLoc();
3123
builder.enterLexicalBlock(loc.line, loc.column);
3124
}
3125
}
3126
} else {
3127
if (sequenceDepth > 1 && node->getOp() == glslang::EOpScope)
3128
builder.leaveLexicalBlock();
3129
--sequenceDepth;
3130
}
3131
3132
return true;
3133
}
3134
case glslang::EOpLinkerObjects:
3135
{
3136
if (visit == glslang::EvPreVisit)
3137
linkageOnly = true;
3138
else
3139
linkageOnly = false;
3140
3141
return true;
3142
}
3143
case glslang::EOpComma:
3144
{
3145
// processing from left to right naturally leaves the right-most
3146
// lying around in the access chain
3147
glslang::TIntermSequence& glslangOperands = node->getSequence();
3148
for (int i = 0; i < (int)glslangOperands.size(); ++i)
3149
glslangOperands[i]->traverse(this);
3150
3151
return false;
3152
}
3153
case glslang::EOpFunction:
3154
if (visit == glslang::EvPreVisit) {
3155
if (options.generateDebugInfo) {
3156
builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
3157
}
3158
if (isShaderEntryPoint(node)) {
3159
inEntryPoint = true;
3160
builder.setBuildPoint(shaderEntry->getLastBlock());
3161
builder.enterFunction(shaderEntry);
3162
currentFunction = shaderEntry;
3163
} else {
3164
// SPIR-V functions should already be in the functionMap from the prepass
3165
// that called makeFunctions().
3166
currentFunction = functionMap[node->getName().c_str()];
3167
spv::Block* functionBlock = currentFunction->getEntryBlock();
3168
builder.setBuildPoint(functionBlock);
3169
builder.enterFunction(currentFunction);
3170
}
3171
if (options.generateDebugInfo && !options.emitNonSemanticShaderDebugInfo) {
3172
const auto& loc = node->getLoc();
3173
const char* sourceFileName = loc.getFilename();
3174
spv::Id sourceFileId = sourceFileName ? builder.getStringId(sourceFileName) : builder.getMainFileId();
3175
currentFunction->setDebugLineInfo(sourceFileId, loc.line, loc.column);
3176
}
3177
} else {
3178
// Here we have finished visiting the function (post-visit). Finalize it.
3179
if (options.generateDebugInfo) {
3180
if (glslangIntermediate->getSource() == glslang::EShSourceGlsl && node->getSequence().size() > 1) {
3181
auto endLoc = node->getSequence()[1]->getAsAggregate()->getEndLoc();
3182
builder.setDebugSourceLocation(endLoc.line, endLoc.getFilename());
3183
}
3184
}
3185
if (inEntryPoint)
3186
entryPointTerminated = true;
3187
builder.leaveFunction();
3188
inEntryPoint = false;
3189
currentFunction = nullptr;
3190
}
3191
3192
return true;
3193
case glslang::EOpParameters:
3194
// Parameters will have been consumed by EOpFunction processing, but not
3195
// the body, so we still visited the function node's children, making this
3196
// child redundant.
3197
return false;
3198
case glslang::EOpFunctionCall:
3199
{
3200
builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
3201
if (node->isUserDefined())
3202
result = handleUserFunctionCall(node);
3203
if (result) {
3204
builder.clearAccessChain();
3205
builder.setAccessChainRValue(result);
3206
} else
3207
logger->missingFunctionality("missing user function; linker needs to catch that");
3208
3209
return false;
3210
}
3211
case glslang::EOpConstructMat2x2:
3212
case glslang::EOpConstructMat2x3:
3213
case glslang::EOpConstructMat2x4:
3214
case glslang::EOpConstructMat3x2:
3215
case glslang::EOpConstructMat3x3:
3216
case glslang::EOpConstructMat3x4:
3217
case glslang::EOpConstructMat4x2:
3218
case glslang::EOpConstructMat4x3:
3219
case glslang::EOpConstructMat4x4:
3220
case glslang::EOpConstructDMat2x2:
3221
case glslang::EOpConstructDMat2x3:
3222
case glslang::EOpConstructDMat2x4:
3223
case glslang::EOpConstructDMat3x2:
3224
case glslang::EOpConstructDMat3x3:
3225
case glslang::EOpConstructDMat3x4:
3226
case glslang::EOpConstructDMat4x2:
3227
case glslang::EOpConstructDMat4x3:
3228
case glslang::EOpConstructDMat4x4:
3229
case glslang::EOpConstructIMat2x2:
3230
case glslang::EOpConstructIMat2x3:
3231
case glslang::EOpConstructIMat2x4:
3232
case glslang::EOpConstructIMat3x2:
3233
case glslang::EOpConstructIMat3x3:
3234
case glslang::EOpConstructIMat3x4:
3235
case glslang::EOpConstructIMat4x2:
3236
case glslang::EOpConstructIMat4x3:
3237
case glslang::EOpConstructIMat4x4:
3238
case glslang::EOpConstructUMat2x2:
3239
case glslang::EOpConstructUMat2x3:
3240
case glslang::EOpConstructUMat2x4:
3241
case glslang::EOpConstructUMat3x2:
3242
case glslang::EOpConstructUMat3x3:
3243
case glslang::EOpConstructUMat3x4:
3244
case glslang::EOpConstructUMat4x2:
3245
case glslang::EOpConstructUMat4x3:
3246
case glslang::EOpConstructUMat4x4:
3247
case glslang::EOpConstructBMat2x2:
3248
case glslang::EOpConstructBMat2x3:
3249
case glslang::EOpConstructBMat2x4:
3250
case glslang::EOpConstructBMat3x2:
3251
case glslang::EOpConstructBMat3x3:
3252
case glslang::EOpConstructBMat3x4:
3253
case glslang::EOpConstructBMat4x2:
3254
case glslang::EOpConstructBMat4x3:
3255
case glslang::EOpConstructBMat4x4:
3256
case glslang::EOpConstructF16Mat2x2:
3257
case glslang::EOpConstructF16Mat2x3:
3258
case glslang::EOpConstructF16Mat2x4:
3259
case glslang::EOpConstructF16Mat3x2:
3260
case glslang::EOpConstructF16Mat3x3:
3261
case glslang::EOpConstructF16Mat3x4:
3262
case glslang::EOpConstructF16Mat4x2:
3263
case glslang::EOpConstructF16Mat4x3:
3264
case glslang::EOpConstructF16Mat4x4:
3265
isMatrix = true;
3266
[[fallthrough]];
3267
case glslang::EOpConstructFloat:
3268
case glslang::EOpConstructVec2:
3269
case glslang::EOpConstructVec3:
3270
case glslang::EOpConstructVec4:
3271
case glslang::EOpConstructDouble:
3272
case glslang::EOpConstructDVec2:
3273
case glslang::EOpConstructDVec3:
3274
case glslang::EOpConstructDVec4:
3275
case glslang::EOpConstructFloat16:
3276
case glslang::EOpConstructF16Vec2:
3277
case glslang::EOpConstructF16Vec3:
3278
case glslang::EOpConstructF16Vec4:
3279
case glslang::EOpConstructBFloat16:
3280
case glslang::EOpConstructBF16Vec2:
3281
case glslang::EOpConstructBF16Vec3:
3282
case glslang::EOpConstructBF16Vec4:
3283
case glslang::EOpConstructFloatE5M2:
3284
case glslang::EOpConstructFloatE5M2Vec2:
3285
case glslang::EOpConstructFloatE5M2Vec3:
3286
case glslang::EOpConstructFloatE5M2Vec4:
3287
case glslang::EOpConstructFloatE4M3:
3288
case glslang::EOpConstructFloatE4M3Vec2:
3289
case glslang::EOpConstructFloatE4M3Vec3:
3290
case glslang::EOpConstructFloatE4M3Vec4:
3291
case glslang::EOpConstructBool:
3292
case glslang::EOpConstructBVec2:
3293
case glslang::EOpConstructBVec3:
3294
case glslang::EOpConstructBVec4:
3295
case glslang::EOpConstructInt8:
3296
case glslang::EOpConstructI8Vec2:
3297
case glslang::EOpConstructI8Vec3:
3298
case glslang::EOpConstructI8Vec4:
3299
case glslang::EOpConstructUint8:
3300
case glslang::EOpConstructU8Vec2:
3301
case glslang::EOpConstructU8Vec3:
3302
case glslang::EOpConstructU8Vec4:
3303
case glslang::EOpConstructInt16:
3304
case glslang::EOpConstructI16Vec2:
3305
case glslang::EOpConstructI16Vec3:
3306
case glslang::EOpConstructI16Vec4:
3307
case glslang::EOpConstructUint16:
3308
case glslang::EOpConstructU16Vec2:
3309
case glslang::EOpConstructU16Vec3:
3310
case glslang::EOpConstructU16Vec4:
3311
case glslang::EOpConstructInt:
3312
case glslang::EOpConstructIVec2:
3313
case glslang::EOpConstructIVec3:
3314
case glslang::EOpConstructIVec4:
3315
case glslang::EOpConstructUint:
3316
case glslang::EOpConstructUVec2:
3317
case glslang::EOpConstructUVec3:
3318
case glslang::EOpConstructUVec4:
3319
case glslang::EOpConstructInt64:
3320
case glslang::EOpConstructI64Vec2:
3321
case glslang::EOpConstructI64Vec3:
3322
case glslang::EOpConstructI64Vec4:
3323
case glslang::EOpConstructUint64:
3324
case glslang::EOpConstructU64Vec2:
3325
case glslang::EOpConstructU64Vec3:
3326
case glslang::EOpConstructU64Vec4:
3327
case glslang::EOpConstructStruct:
3328
case glslang::EOpConstructTextureSampler:
3329
case glslang::EOpConstructReference:
3330
case glslang::EOpConstructCooperativeMatrixNV:
3331
case glslang::EOpConstructCooperativeMatrixKHR:
3332
case glslang::EOpConstructCooperativeVectorNV:
3333
case glslang::EOpConstructSaturated:
3334
{
3335
builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
3336
std::vector<spv::Id> arguments;
3337
translateArguments(*node, arguments, lvalueCoherentFlags);
3338
spv::Id constructed;
3339
if (node->getOp() == glslang::EOpConstructTextureSampler) {
3340
const glslang::TType& texType = node->getSequence()[0]->getAsTyped()->getType();
3341
if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6 &&
3342
texType.getSampler().isBuffer()) {
3343
// SamplerBuffer is not supported in spirv1.6 so
3344
// `samplerBuffer(textureBuffer, sampler)` is a no-op
3345
// and textureBuffer is the result going forward
3346
constructed = arguments[0];
3347
} else
3348
constructed = builder.createOp(spv::Op::OpSampledImage, resultType(), arguments);
3349
} else if (node->getOp() == glslang::EOpConstructCooperativeMatrixKHR &&
3350
node->getType().isCoopMatKHR() && node->getSequence()[0]->getAsTyped()->getType().isCoopMatKHR()) {
3351
builder.addCapability(spv::Capability::CooperativeMatrixConversionsNV);
3352
builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
3353
constructed = builder.createCooperativeMatrixConversion(resultType(), arguments[0]);
3354
} else if (node->getOp() == glslang::EOpConstructCooperativeVectorNV &&
3355
arguments.size() == 1 &&
3356
builder.getTypeId(arguments[0]) == resultType()) {
3357
constructed = arguments[0];
3358
} else if (node->getOp() == glslang::EOpConstructStruct ||
3359
node->getOp() == glslang::EOpConstructCooperativeMatrixNV ||
3360
node->getOp() == glslang::EOpConstructCooperativeMatrixKHR ||
3361
node->getType().isArray() ||
3362
// Handle constructing coopvec from one component here, to avoid the component
3363
// getting smeared
3364
(node->getOp() == glslang::EOpConstructCooperativeVectorNV && arguments.size() == 1 && builder.isScalar(arguments[0]))) {
3365
std::vector<spv::Id> constituents;
3366
for (int c = 0; c < (int)arguments.size(); ++c)
3367
constituents.push_back(arguments[c]);
3368
constructed = createCompositeConstruct(resultType(), constituents);
3369
} else if (isMatrix)
3370
constructed = builder.createMatrixConstructor(precision, arguments, resultType());
3371
else if (node->getOp() == glslang::EOpConstructSaturated) {
3372
OpDecorations decorations = { TranslatePrecisionDecoration(node->getOperationPrecision()),
3373
TranslateNoContractionDecoration(node->getType().getQualifier()),
3374
TranslateNonUniformDecoration(lvalueCoherentFlags) };
3375
3376
constructed = createConversion(node->getOp(), decorations, resultType(), arguments[1],
3377
node->getType().getBasicType(), node->getSequence()[1]->getAsTyped()->getBasicType());
3378
builder.addDecoration(constructed, spv::Decoration::SaturatedToLargestFloat8NormalConversionEXT);
3379
builder.createStore(constructed, arguments[0]);
3380
}
3381
else
3382
constructed = builder.createConstructor(precision, arguments, resultType());
3383
3384
if (node->getType().getQualifier().isNonUniform()) {
3385
builder.addDecoration(constructed, spv::Decoration::NonUniformEXT);
3386
}
3387
3388
builder.clearAccessChain();
3389
builder.setAccessChainRValue(constructed);
3390
3391
return false;
3392
}
3393
3394
// These six are component-wise compares with component-wise results.
3395
// Forward on to createBinaryOperation(), requesting a vector result.
3396
case glslang::EOpLessThan:
3397
case glslang::EOpGreaterThan:
3398
case glslang::EOpLessThanEqual:
3399
case glslang::EOpGreaterThanEqual:
3400
case glslang::EOpVectorEqual:
3401
case glslang::EOpVectorNotEqual:
3402
{
3403
// Map the operation to a binary
3404
binOp = node->getOp();
3405
reduceComparison = false;
3406
switch (node->getOp()) {
3407
case glslang::EOpVectorEqual: binOp = glslang::EOpVectorEqual; break;
3408
case glslang::EOpVectorNotEqual: binOp = glslang::EOpVectorNotEqual; break;
3409
default: binOp = node->getOp(); break;
3410
}
3411
3412
break;
3413
}
3414
case glslang::EOpMul:
3415
// component-wise matrix multiply
3416
binOp = glslang::EOpMul;
3417
break;
3418
case glslang::EOpOuterProduct:
3419
// two vectors multiplied to make a matrix
3420
binOp = glslang::EOpOuterProduct;
3421
break;
3422
case glslang::EOpDot:
3423
{
3424
// for scalar dot product, use multiply
3425
glslang::TIntermSequence& glslangOperands = node->getSequence();
3426
if (glslangOperands[0]->getAsTyped()->getVectorSize() == 1)
3427
binOp = glslang::EOpMul;
3428
break;
3429
}
3430
case glslang::EOpMod:
3431
// when an aggregate, this is the floating-point mod built-in function,
3432
// which can be emitted by the one in createBinaryOperation()
3433
binOp = glslang::EOpMod;
3434
break;
3435
3436
case glslang::EOpEmitVertex:
3437
case glslang::EOpEndPrimitive:
3438
case glslang::EOpBarrier:
3439
case glslang::EOpMemoryBarrier:
3440
case glslang::EOpMemoryBarrierAtomicCounter:
3441
case glslang::EOpMemoryBarrierBuffer:
3442
case glslang::EOpMemoryBarrierImage:
3443
case glslang::EOpMemoryBarrierShared:
3444
case glslang::EOpGroupMemoryBarrier:
3445
case glslang::EOpDeviceMemoryBarrier:
3446
case glslang::EOpAllMemoryBarrierWithGroupSync:
3447
case glslang::EOpDeviceMemoryBarrierWithGroupSync:
3448
case glslang::EOpWorkgroupMemoryBarrier:
3449
case glslang::EOpWorkgroupMemoryBarrierWithGroupSync:
3450
case glslang::EOpSubgroupBarrier:
3451
case glslang::EOpSubgroupMemoryBarrier:
3452
case glslang::EOpSubgroupMemoryBarrierBuffer:
3453
case glslang::EOpSubgroupMemoryBarrierImage:
3454
case glslang::EOpSubgroupMemoryBarrierShared:
3455
noReturnValue = true;
3456
// These all have 0 operands and will naturally finish up in the code below for 0 operands
3457
break;
3458
3459
case glslang::EOpAtomicAdd:
3460
case glslang::EOpAtomicSubtract:
3461
case glslang::EOpAtomicMin:
3462
case glslang::EOpAtomicMax:
3463
case glslang::EOpAtomicAnd:
3464
case glslang::EOpAtomicOr:
3465
case glslang::EOpAtomicXor:
3466
case glslang::EOpAtomicExchange:
3467
case glslang::EOpAtomicCompSwap:
3468
atomic = true;
3469
break;
3470
3471
case glslang::EOpAtomicStore:
3472
noReturnValue = true;
3473
[[fallthrough]];
3474
case glslang::EOpAtomicLoad:
3475
atomic = true;
3476
break;
3477
3478
case glslang::EOpAtomicCounterAdd:
3479
case glslang::EOpAtomicCounterSubtract:
3480
case glslang::EOpAtomicCounterMin:
3481
case glslang::EOpAtomicCounterMax:
3482
case glslang::EOpAtomicCounterAnd:
3483
case glslang::EOpAtomicCounterOr:
3484
case glslang::EOpAtomicCounterXor:
3485
case glslang::EOpAtomicCounterExchange:
3486
case glslang::EOpAtomicCounterCompSwap:
3487
builder.addExtension("SPV_KHR_shader_atomic_counter_ops");
3488
builder.addCapability(spv::Capability::AtomicStorageOps);
3489
atomic = true;
3490
break;
3491
3492
case glslang::EOpAbsDifference:
3493
case glslang::EOpAddSaturate:
3494
case glslang::EOpSubSaturate:
3495
case glslang::EOpAverage:
3496
case glslang::EOpAverageRounded:
3497
case glslang::EOpMul32x16:
3498
builder.addCapability(spv::Capability::IntegerFunctions2INTEL);
3499
builder.addExtension("SPV_INTEL_shader_integer_functions2");
3500
binOp = node->getOp();
3501
break;
3502
3503
case glslang::EOpExpectEXT:
3504
builder.addCapability(spv::Capability::ExpectAssumeKHR);
3505
builder.addExtension(spv::E_SPV_KHR_expect_assume);
3506
binOp = node->getOp();
3507
break;
3508
3509
case glslang::EOpIgnoreIntersectionNV:
3510
case glslang::EOpTerminateRayNV:
3511
case glslang::EOpTraceNV:
3512
case glslang::EOpTraceRayMotionNV:
3513
case glslang::EOpTraceKHR:
3514
case glslang::EOpExecuteCallableNV:
3515
case glslang::EOpExecuteCallableKHR:
3516
case glslang::EOpWritePackedPrimitiveIndices4x8NV:
3517
case glslang::EOpEmitMeshTasksEXT:
3518
case glslang::EOpSetMeshOutputsEXT:
3519
noReturnValue = true;
3520
break;
3521
case glslang::EOpRayQueryInitialize:
3522
case glslang::EOpRayQueryTerminate:
3523
case glslang::EOpRayQueryGenerateIntersection:
3524
case glslang::EOpRayQueryConfirmIntersection:
3525
builder.addExtension("SPV_KHR_ray_query");
3526
builder.addCapability(spv::Capability::RayQueryKHR);
3527
noReturnValue = true;
3528
break;
3529
case glslang::EOpRayQueryProceed:
3530
case glslang::EOpRayQueryGetIntersectionType:
3531
case glslang::EOpRayQueryGetRayTMin:
3532
case glslang::EOpRayQueryGetRayFlags:
3533
case glslang::EOpRayQueryGetIntersectionT:
3534
case glslang::EOpRayQueryGetIntersectionInstanceCustomIndex:
3535
case glslang::EOpRayQueryGetIntersectionInstanceId:
3536
case glslang::EOpRayQueryGetIntersectionInstanceShaderBindingTableRecordOffset:
3537
case glslang::EOpRayQueryGetIntersectionGeometryIndex:
3538
case glslang::EOpRayQueryGetIntersectionPrimitiveIndex:
3539
case glslang::EOpRayQueryGetIntersectionBarycentrics:
3540
case glslang::EOpRayQueryGetIntersectionFrontFace:
3541
case glslang::EOpRayQueryGetIntersectionCandidateAABBOpaque:
3542
case glslang::EOpRayQueryGetIntersectionObjectRayDirection:
3543
case glslang::EOpRayQueryGetIntersectionObjectRayOrigin:
3544
case glslang::EOpRayQueryGetWorldRayDirection:
3545
case glslang::EOpRayQueryGetWorldRayOrigin:
3546
case glslang::EOpRayQueryGetIntersectionObjectToWorld:
3547
case glslang::EOpRayQueryGetIntersectionWorldToObject:
3548
builder.addExtension("SPV_KHR_ray_query");
3549
builder.addCapability(spv::Capability::RayQueryKHR);
3550
break;
3551
case glslang::EOpCooperativeMatrixLoad:
3552
case glslang::EOpCooperativeMatrixStore:
3553
case glslang::EOpCooperativeMatrixLoadNV:
3554
case glslang::EOpCooperativeMatrixStoreNV:
3555
case glslang::EOpCooperativeMatrixLoadTensorNV:
3556
case glslang::EOpCooperativeMatrixStoreTensorNV:
3557
case glslang::EOpCooperativeMatrixReduceNV:
3558
case glslang::EOpCooperativeMatrixPerElementOpNV:
3559
case glslang::EOpCooperativeMatrixTransposeNV:
3560
case glslang::EOpCooperativeVectorMatMulNV:
3561
case glslang::EOpCooperativeVectorMatMulAddNV:
3562
case glslang::EOpCooperativeVectorLoadNV:
3563
case glslang::EOpCooperativeVectorStoreNV:
3564
case glslang::EOpCooperativeVectorOuterProductAccumulateNV:
3565
case glslang::EOpCooperativeVectorReduceSumAccumulateNV:
3566
noReturnValue = true;
3567
break;
3568
case glslang::EOpBeginInvocationInterlock:
3569
case glslang::EOpEndInvocationInterlock:
3570
builder.addExtension(spv::E_SPV_EXT_fragment_shader_interlock);
3571
noReturnValue = true;
3572
break;
3573
3574
case glslang::EOpHitObjectTraceRayNV:
3575
case glslang::EOpHitObjectTraceRayMotionNV:
3576
case glslang::EOpHitObjectGetAttributesNV:
3577
case glslang::EOpHitObjectExecuteShaderNV:
3578
case glslang::EOpHitObjectRecordEmptyNV:
3579
case glslang::EOpHitObjectRecordMissNV:
3580
case glslang::EOpHitObjectRecordMissMotionNV:
3581
case glslang::EOpHitObjectRecordHitNV:
3582
case glslang::EOpHitObjectRecordHitMotionNV:
3583
case glslang::EOpHitObjectRecordHitWithIndexNV:
3584
case glslang::EOpHitObjectRecordHitWithIndexMotionNV:
3585
case glslang::EOpReorderThreadNV:
3586
noReturnValue = true;
3587
[[fallthrough]];
3588
case glslang::EOpHitObjectIsEmptyNV:
3589
case glslang::EOpHitObjectIsMissNV:
3590
case glslang::EOpHitObjectIsHitNV:
3591
case glslang::EOpHitObjectGetRayTMinNV:
3592
case glslang::EOpHitObjectGetRayTMaxNV:
3593
case glslang::EOpHitObjectGetObjectRayOriginNV:
3594
case glslang::EOpHitObjectGetObjectRayDirectionNV:
3595
case glslang::EOpHitObjectGetWorldRayOriginNV:
3596
case glslang::EOpHitObjectGetWorldRayDirectionNV:
3597
case glslang::EOpHitObjectGetObjectToWorldNV:
3598
case glslang::EOpHitObjectGetWorldToObjectNV:
3599
case glslang::EOpHitObjectGetInstanceCustomIndexNV:
3600
case glslang::EOpHitObjectGetInstanceIdNV:
3601
case glslang::EOpHitObjectGetGeometryIndexNV:
3602
case glslang::EOpHitObjectGetPrimitiveIndexNV:
3603
case glslang::EOpHitObjectGetHitKindNV:
3604
case glslang::EOpHitObjectGetCurrentTimeNV:
3605
case glslang::EOpHitObjectGetShaderBindingTableRecordIndexNV:
3606
case glslang::EOpHitObjectGetShaderRecordBufferHandleNV:
3607
builder.addExtension(spv::E_SPV_NV_shader_invocation_reorder);
3608
builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
3609
break;
3610
3611
case glslang::EOpHitObjectGetLSSPositionsNV:
3612
case glslang::EOpHitObjectGetLSSRadiiNV:
3613
builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
3614
builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
3615
builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
3616
noReturnValue = true;
3617
break;
3618
3619
case glslang::EOpRayQueryGetIntersectionLSSPositionsNV:
3620
case glslang::EOpRayQueryGetIntersectionLSSRadiiNV:
3621
builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
3622
builder.addCapability(spv::Capability::RayQueryKHR);
3623
builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
3624
noReturnValue = true;
3625
break;
3626
3627
case glslang::EOpRayQueryGetIntersectionSpherePositionNV:
3628
case glslang::EOpRayQueryGetIntersectionSphereRadiusNV:
3629
case glslang::EOpRayQueryIsSphereHitNV:
3630
builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
3631
builder.addCapability(spv::Capability::RayQueryKHR);
3632
builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);
3633
builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
3634
break;
3635
3636
case glslang::EOpRayQueryGetIntersectionLSSHitValueNV:
3637
case glslang::EOpRayQueryIsLSSHitNV:
3638
builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
3639
builder.addCapability(spv::Capability::RayQueryKHR);
3640
builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
3641
break;
3642
3643
case glslang::EOpHitObjectTraceRayEXT:
3644
case glslang::EOpHitObjectTraceRayMotionEXT:
3645
case glslang::EOpHitObjectGetAttributesEXT:
3646
case glslang::EOpHitObjectExecuteShaderEXT:
3647
case glslang::EOpHitObjectRecordEmptyEXT:
3648
case glslang::EOpHitObjectRecordMissEXT:
3649
case glslang::EOpHitObjectRecordMissMotionEXT:
3650
case glslang::EOpReorderThreadEXT:
3651
case glslang::EOpHitObjectSetShaderBindingTableRecordIndexEXT:
3652
case glslang::EOpHitObjectReorderExecuteEXT:
3653
case glslang::EOpHitObjectTraceReorderExecuteEXT:
3654
case glslang::EOpHitObjectTraceMotionReorderExecuteEXT:
3655
case glslang::EOpHitObjectRecordFromQueryEXT:
3656
case glslang::EOpHitObjectGetIntersectionTriangleVertexPositionsEXT:
3657
noReturnValue = true;
3658
[[fallthrough]];
3659
case glslang::EOpHitObjectIsEmptyEXT:
3660
case glslang::EOpHitObjectIsMissEXT:
3661
case glslang::EOpHitObjectIsHitEXT:
3662
case glslang::EOpHitObjectGetRayTMinEXT:
3663
case glslang::EOpHitObjectGetRayTMaxEXT:
3664
case glslang::EOpHitObjectGetRayFlagsEXT:
3665
case glslang::EOpHitObjectGetObjectRayOriginEXT:
3666
case glslang::EOpHitObjectGetObjectRayDirectionEXT:
3667
case glslang::EOpHitObjectGetWorldRayOriginEXT:
3668
case glslang::EOpHitObjectGetWorldRayDirectionEXT:
3669
case glslang::EOpHitObjectGetObjectToWorldEXT:
3670
case glslang::EOpHitObjectGetWorldToObjectEXT:
3671
case glslang::EOpHitObjectGetInstanceCustomIndexEXT:
3672
case glslang::EOpHitObjectGetInstanceIdEXT:
3673
case glslang::EOpHitObjectGetGeometryIndexEXT:
3674
case glslang::EOpHitObjectGetPrimitiveIndexEXT:
3675
case glslang::EOpHitObjectGetHitKindEXT:
3676
case glslang::EOpHitObjectGetCurrentTimeEXT:
3677
case glslang::EOpHitObjectGetShaderBindingTableRecordIndexEXT:
3678
case glslang::EOpHitObjectGetShaderRecordBufferHandleEXT:
3679
builder.addExtension(spv::E_SPV_EXT_shader_invocation_reorder);
3680
builder.addCapability(spv::Capability::ShaderInvocationReorderEXT);
3681
break;
3682
3683
case glslang::EOpRayQueryGetIntersectionTriangleVertexPositionsEXT:
3684
builder.addExtension(spv::E_SPV_KHR_ray_tracing_position_fetch);
3685
builder.addCapability(spv::Capability::RayQueryPositionFetchKHR);
3686
noReturnValue = true;
3687
break;
3688
case glslang::EOpImageSampleWeightedQCOM:
3689
builder.addCapability(spv::Capability::TextureSampleWeightedQCOM);
3690
builder.addExtension(spv::E_SPV_QCOM_image_processing);
3691
break;
3692
case glslang::EOpImageBoxFilterQCOM:
3693
builder.addCapability(spv::Capability::TextureBoxFilterQCOM);
3694
builder.addExtension(spv::E_SPV_QCOM_image_processing);
3695
break;
3696
case glslang::EOpImageBlockMatchSADQCOM:
3697
case glslang::EOpImageBlockMatchSSDQCOM:
3698
builder.addCapability(spv::Capability::TextureBlockMatchQCOM);
3699
builder.addExtension(spv::E_SPV_QCOM_image_processing);
3700
break;
3701
case glslang::EOpTensorWriteARM:
3702
noReturnValue = true;
3703
break;
3704
3705
case glslang::EOpImageBlockMatchWindowSSDQCOM:
3706
case glslang::EOpImageBlockMatchWindowSADQCOM:
3707
builder.addCapability(spv::Capability::TextureBlockMatchQCOM);
3708
builder.addExtension(spv::E_SPV_QCOM_image_processing);
3709
builder.addCapability(spv::Capability::TextureBlockMatch2QCOM);
3710
builder.addExtension(spv::E_SPV_QCOM_image_processing2);
3711
break;
3712
3713
case glslang::EOpImageBlockMatchGatherSSDQCOM:
3714
case glslang::EOpImageBlockMatchGatherSADQCOM:
3715
builder.addCapability(spv::Capability::TextureBlockMatchQCOM);
3716
builder.addExtension(spv::E_SPV_QCOM_image_processing);
3717
builder.addCapability(spv::Capability::TextureBlockMatch2QCOM);
3718
builder.addExtension(spv::E_SPV_QCOM_image_processing2);
3719
break;
3720
3721
case glslang::EOpFetchMicroTriangleVertexPositionNV:
3722
case glslang::EOpFetchMicroTriangleVertexBarycentricNV:
3723
builder.addExtension(spv::E_SPV_NV_displacement_micromap);
3724
builder.addCapability(spv::Capability::DisplacementMicromapNV);
3725
break;
3726
3727
case glslang::EOpRayQueryGetIntersectionClusterIdNV:
3728
builder.addExtension(spv::E_SPV_NV_cluster_acceleration_structure);
3729
builder.addCapability(spv::Capability::RayQueryKHR);
3730
builder.addCapability(spv::Capability::RayTracingClusterAccelerationStructureNV);
3731
break;
3732
3733
case glslang::EOpDebugPrintf:
3734
noReturnValue = true;
3735
break;
3736
3737
default:
3738
break;
3739
}
3740
3741
//
3742
// See if it maps to a regular operation.
3743
//
3744
if (binOp != glslang::EOpNull) {
3745
glslang::TIntermTyped* left = node->getSequence()[0]->getAsTyped();
3746
glslang::TIntermTyped* right = node->getSequence()[1]->getAsTyped();
3747
assert(left && right);
3748
3749
builder.clearAccessChain();
3750
left->traverse(this);
3751
spv::Id leftId = accessChainLoad(left->getType());
3752
3753
builder.clearAccessChain();
3754
right->traverse(this);
3755
spv::Id rightId = accessChainLoad(right->getType());
3756
3757
builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
3758
OpDecorations decorations = { precision,
3759
TranslateNoContractionDecoration(node->getType().getQualifier()),
3760
TranslateNonUniformDecoration(node->getType().getQualifier()) };
3761
result = createBinaryOperation(binOp, decorations,
3762
resultType(), leftId, rightId,
3763
left->getType().getBasicType(), reduceComparison);
3764
3765
// code above should only make binOp that exists in createBinaryOperation
3766
assert(result != spv::NoResult);
3767
builder.clearAccessChain();
3768
builder.setAccessChainRValue(result);
3769
3770
return false;
3771
}
3772
3773
//
3774
// Create the list of operands.
3775
//
3776
glslang::TIntermSequence& glslangOperands = node->getSequence();
3777
std::vector<spv::Id> operands;
3778
std::vector<spv::IdImmediate> memoryAccessOperands;
3779
for (int arg = 0; arg < (int)glslangOperands.size(); ++arg) {
3780
// special case l-value operands; there are just a few
3781
bool lvalue = false;
3782
switch (node->getOp()) {
3783
case glslang::EOpModf:
3784
if (arg == 1)
3785
lvalue = true;
3786
break;
3787
3788
3789
3790
case glslang::EOpHitObjectRecordFromQueryEXT:
3791
case glslang::EOpHitObjectGetIntersectionTriangleVertexPositionsEXT:
3792
if (arg == 0 || arg == 1)
3793
lvalue = true;
3794
break;
3795
3796
case glslang::EOpHitObjectRecordHitNV:
3797
case glslang::EOpHitObjectRecordHitMotionNV:
3798
case glslang::EOpHitObjectRecordHitWithIndexNV:
3799
case glslang::EOpHitObjectRecordHitWithIndexMotionNV:
3800
case glslang::EOpHitObjectTraceRayNV:
3801
case glslang::EOpHitObjectTraceRayMotionNV:
3802
case glslang::EOpHitObjectExecuteShaderNV:
3803
case glslang::EOpHitObjectRecordMissNV:
3804
case glslang::EOpHitObjectRecordMissMotionNV:
3805
case glslang::EOpHitObjectGetAttributesNV:
3806
case glslang::EOpHitObjectGetClusterIdNV:
3807
case glslang::EOpHitObjectTraceRayEXT:
3808
case glslang::EOpHitObjectTraceRayMotionEXT:
3809
case glslang::EOpHitObjectExecuteShaderEXT:
3810
case glslang::EOpHitObjectRecordMissEXT:
3811
case glslang::EOpHitObjectRecordMissMotionEXT:
3812
case glslang::EOpHitObjectGetAttributesEXT:
3813
case glslang::EOpHitObjectSetShaderBindingTableRecordIndexEXT:
3814
case glslang::EOpHitObjectReorderExecuteEXT:
3815
case glslang::EOpHitObjectTraceReorderExecuteEXT:
3816
case glslang::EOpHitObjectTraceMotionReorderExecuteEXT:
3817
if (arg == 0)
3818
lvalue = true;
3819
break;
3820
3821
case glslang::EOpHitObjectGetLSSPositionsNV:
3822
case glslang::EOpHitObjectGetLSSRadiiNV:
3823
lvalue = true;
3824
break;
3825
3826
case glslang::EOpRayQueryInitialize:
3827
case glslang::EOpRayQueryTerminate:
3828
case glslang::EOpRayQueryConfirmIntersection:
3829
case glslang::EOpRayQueryProceed:
3830
case glslang::EOpRayQueryGenerateIntersection:
3831
case glslang::EOpRayQueryGetIntersectionType:
3832
case glslang::EOpRayQueryGetIntersectionT:
3833
case glslang::EOpRayQueryGetIntersectionInstanceCustomIndex:
3834
case glslang::EOpRayQueryGetIntersectionInstanceId:
3835
case glslang::EOpRayQueryGetIntersectionInstanceShaderBindingTableRecordOffset:
3836
case glslang::EOpRayQueryGetIntersectionGeometryIndex:
3837
case glslang::EOpRayQueryGetIntersectionPrimitiveIndex:
3838
case glslang::EOpRayQueryGetIntersectionBarycentrics:
3839
case glslang::EOpRayQueryGetIntersectionFrontFace:
3840
case glslang::EOpRayQueryGetIntersectionObjectRayDirection:
3841
case glslang::EOpRayQueryGetIntersectionObjectRayOrigin:
3842
case glslang::EOpRayQueryGetIntersectionObjectToWorld:
3843
case glslang::EOpRayQueryGetIntersectionWorldToObject:
3844
case glslang::EOpRayQueryGetIntersectionClusterIdNV:
3845
case glslang::EOpRayQueryGetIntersectionSpherePositionNV:
3846
case glslang::EOpRayQueryGetIntersectionSphereRadiusNV:
3847
case glslang::EOpRayQueryGetIntersectionLSSHitValueNV:
3848
case glslang::EOpRayQueryIsSphereHitNV:
3849
case glslang::EOpRayQueryIsLSSHitNV:
3850
if (arg == 0)
3851
lvalue = true;
3852
break;
3853
3854
case glslang::EOpAtomicAdd:
3855
case glslang::EOpAtomicSubtract:
3856
case glslang::EOpAtomicMin:
3857
case glslang::EOpAtomicMax:
3858
case glslang::EOpAtomicAnd:
3859
case glslang::EOpAtomicOr:
3860
case glslang::EOpAtomicXor:
3861
case glslang::EOpAtomicExchange:
3862
case glslang::EOpAtomicCompSwap:
3863
if (arg == 0)
3864
lvalue = true;
3865
break;
3866
3867
case glslang::EOpFrexp:
3868
if (arg == 1)
3869
lvalue = true;
3870
break;
3871
case glslang::EOpInterpolateAtSample:
3872
case glslang::EOpInterpolateAtOffset:
3873
case glslang::EOpInterpolateAtVertex:
3874
if (arg == 0) {
3875
// If GLSL, use the address of the interpolant argument.
3876
// If HLSL, use an internal version of OpInterpolates that takes
3877
// the rvalue of the interpolant. A fixup pass in spirv-opt
3878
// legalization will remove the OpLoad and convert to an lvalue.
3879
// Had to do this because legalization will only propagate a
3880
// builtin into an rvalue.
3881
lvalue = glslangIntermediate->getSource() != glslang::EShSourceHlsl;
3882
3883
// Does it need a swizzle inversion? If so, evaluation is inverted;
3884
// operate first on the swizzle base, then apply the swizzle.
3885
// That is, we transform
3886
//
3887
// interpolate(v.zy) -> interpolate(v).zy
3888
//
3889
if (glslangOperands[0]->getAsOperator() &&
3890
glslangOperands[0]->getAsOperator()->getOp() == glslang::EOpVectorSwizzle)
3891
invertedType = convertGlslangToSpvType(
3892
glslangOperands[0]->getAsBinaryNode()->getLeft()->getType());
3893
}
3894
break;
3895
case glslang::EOpAtomicLoad:
3896
case glslang::EOpAtomicStore:
3897
case glslang::EOpAtomicCounterAdd:
3898
case glslang::EOpAtomicCounterSubtract:
3899
case glslang::EOpAtomicCounterMin:
3900
case glslang::EOpAtomicCounterMax:
3901
case glslang::EOpAtomicCounterAnd:
3902
case glslang::EOpAtomicCounterOr:
3903
case glslang::EOpAtomicCounterXor:
3904
case glslang::EOpAtomicCounterExchange:
3905
case glslang::EOpAtomicCounterCompSwap:
3906
if (arg == 0)
3907
lvalue = true;
3908
break;
3909
case glslang::EOpAddCarry:
3910
case glslang::EOpSubBorrow:
3911
if (arg == 2)
3912
lvalue = true;
3913
break;
3914
case glslang::EOpUMulExtended:
3915
case glslang::EOpIMulExtended:
3916
if (arg >= 2)
3917
lvalue = true;
3918
break;
3919
case glslang::EOpCooperativeMatrixLoad:
3920
case glslang::EOpCooperativeMatrixLoadNV:
3921
case glslang::EOpCooperativeMatrixLoadTensorNV:
3922
case glslang::EOpCooperativeVectorLoadNV:
3923
if (arg == 0 || arg == 1)
3924
lvalue = true;
3925
break;
3926
case glslang::EOpCooperativeMatrixStore:
3927
case glslang::EOpCooperativeMatrixStoreNV:
3928
case glslang::EOpCooperativeMatrixStoreTensorNV:
3929
case glslang::EOpCooperativeVectorStoreNV:
3930
if (arg == 1)
3931
lvalue = true;
3932
break;
3933
case glslang::EOpCooperativeVectorMatMulNV:
3934
if (arg == 0 || arg == 3)
3935
lvalue = true;
3936
break;
3937
case glslang::EOpCooperativeVectorMatMulAddNV:
3938
if (arg == 0 || arg == 3 || arg == 6)
3939
lvalue = true;
3940
break;
3941
case glslang::EOpCooperativeVectorOuterProductAccumulateNV:
3942
if (arg == 2)
3943
lvalue = true;
3944
break;
3945
case glslang::EOpCooperativeVectorReduceSumAccumulateNV:
3946
if (arg == 1)
3947
lvalue = true;
3948
break;
3949
case glslang::EOpCooperativeMatrixReduceNV:
3950
case glslang::EOpCooperativeMatrixPerElementOpNV:
3951
case glslang::EOpCooperativeMatrixTransposeNV:
3952
if (arg == 0)
3953
lvalue = true;
3954
break;
3955
case glslang::EOpSpirvInst:
3956
if (glslangOperands[arg]->getAsTyped()->getQualifier().isSpirvByReference())
3957
lvalue = true;
3958
break;
3959
case glslang::EOpReorderThreadNV:
3960
case glslang::EOpReorderThreadEXT:
3961
//Three variants of reorderThreadNV, two of them use hitObjectNV
3962
if (arg == 0 && glslangOperands.size() != 2)
3963
lvalue = true;
3964
break;
3965
case glslang::EOpRayQueryGetIntersectionTriangleVertexPositionsEXT:
3966
case glslang::EOpRayQueryGetIntersectionLSSPositionsNV:
3967
case glslang::EOpRayQueryGetIntersectionLSSRadiiNV:
3968
if (arg == 0 || arg == 2)
3969
lvalue = true;
3970
break;
3971
case glslang::EOpTensorReadARM:
3972
if (arg == 2)
3973
lvalue = true;
3974
break;
3975
default:
3976
break;
3977
}
3978
builder.clearAccessChain();
3979
if (invertedType != spv::NoType && arg == 0)
3980
glslangOperands[0]->getAsBinaryNode()->getLeft()->traverse(this);
3981
else
3982
glslangOperands[arg]->traverse(this);
3983
3984
bool isCoopMat = node->getOp() == glslang::EOpCooperativeMatrixLoad ||
3985
node->getOp() == glslang::EOpCooperativeMatrixStore ||
3986
node->getOp() == glslang::EOpCooperativeMatrixLoadNV ||
3987
node->getOp() == glslang::EOpCooperativeMatrixStoreNV ||
3988
node->getOp() == glslang::EOpCooperativeMatrixLoadTensorNV ||
3989
node->getOp() == glslang::EOpCooperativeMatrixStoreTensorNV;
3990
bool isCoopVec = node->getOp() == glslang::EOpCooperativeVectorLoadNV ||
3991
node->getOp() == glslang::EOpCooperativeVectorStoreNV;
3992
if (isCoopMat || isCoopVec) {
3993
3994
if (arg == 1) {
3995
spv::Builder::AccessChain::CoherentFlags coherentFlags {};
3996
unsigned int alignment {};
3997
if (isCoopMat) {
3998
// fold "element" parameter into the access chain
3999
spv::Builder::AccessChain save = builder.getAccessChain();
4000
builder.clearAccessChain();
4001
glslangOperands[2]->traverse(this);
4002
4003
spv::Id elementId = accessChainLoad(glslangOperands[2]->getAsTyped()->getType());
4004
4005
builder.setAccessChain(save);
4006
4007
// Point to the first element of the array.
4008
builder.accessChainPush(elementId,
4009
TranslateCoherent(glslangOperands[arg]->getAsTyped()->getType()),
4010
glslangOperands[arg]->getAsTyped()->getType().getBufferReferenceAlignment());
4011
coherentFlags = builder.getAccessChain().coherentFlags;
4012
alignment = builder.getAccessChain().alignment;
4013
} else {
4014
coherentFlags = builder.getAccessChain().coherentFlags;
4015
coherentFlags |= TranslateCoherent(glslangOperands[arg]->getAsTyped()->getType());
4016
alignment = 16;
4017
}
4018
4019
spv::MemoryAccessMask memoryAccess = TranslateMemoryAccess(coherentFlags);
4020
if (node->getOp() == glslang::EOpCooperativeMatrixLoad ||
4021
node->getOp() == glslang::EOpCooperativeMatrixLoadNV ||
4022
node->getOp() == glslang::EOpCooperativeMatrixLoadTensorNV ||
4023
node->getOp() == glslang::EOpCooperativeVectorLoadNV)
4024
memoryAccess = (memoryAccess & ~spv::MemoryAccessMask::MakePointerAvailableKHR);
4025
if (node->getOp() == glslang::EOpCooperativeMatrixStore ||
4026
node->getOp() == glslang::EOpCooperativeMatrixStoreNV ||
4027
node->getOp() == glslang::EOpCooperativeMatrixStoreTensorNV ||
4028
node->getOp() == glslang::EOpCooperativeVectorStoreNV)
4029
memoryAccess = (memoryAccess & ~spv::MemoryAccessMask::MakePointerVisibleKHR);
4030
if (builder.getStorageClass(builder.getAccessChain().base) ==
4031
spv::StorageClass::PhysicalStorageBufferEXT) {
4032
memoryAccess = (spv::MemoryAccessMask)(memoryAccess | spv::MemoryAccessMask::Aligned);
4033
}
4034
4035
memoryAccessOperands.push_back(spv::IdImmediate(false, memoryAccess));
4036
4037
if (anySet(memoryAccess, spv::MemoryAccessMask::Aligned)) {
4038
memoryAccessOperands.push_back(spv::IdImmediate(false, alignment));
4039
}
4040
4041
if (anySet(memoryAccess,
4042
spv::MemoryAccessMask::MakePointerAvailableKHR | spv::MemoryAccessMask::MakePointerVisibleKHR)) {
4043
memoryAccessOperands.push_back(spv::IdImmediate(true,
4044
builder.makeUintConstant(TranslateMemoryScope(coherentFlags))));
4045
}
4046
} else if (isCoopMat && arg == 2) {
4047
continue;
4048
}
4049
}
4050
4051
// for l-values, pass the address, for r-values, pass the value
4052
if (lvalue) {
4053
if (invertedType == spv::NoType && !builder.isSpvLvalue()) {
4054
// SPIR-V cannot represent an l-value containing a swizzle that doesn't
4055
// reduce to a simple access chain. So, we need a temporary vector to
4056
// receive the result, and must later swizzle that into the original
4057
// l-value.
4058
complexLvalues.push_back(builder.getAccessChain());
4059
temporaryLvalues.push_back(builder.createVariable(
4060
spv::NoPrecision, spv::StorageClass::Function,
4061
builder.accessChainGetInferredType(), "swizzleTemp"));
4062
operands.push_back(temporaryLvalues.back());
4063
} else {
4064
operands.push_back(builder.accessChainGetLValue());
4065
}
4066
lvalueCoherentFlags = builder.getAccessChain().coherentFlags;
4067
lvalueCoherentFlags |= TranslateCoherent(glslangOperands[arg]->getAsTyped()->getType());
4068
} else {
4069
builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
4070
glslang::TOperator glslangOp = node->getOp();
4071
if (arg == 1 &&
4072
(glslangOp == glslang::EOpRayQueryGetIntersectionType ||
4073
glslangOp == glslang::EOpRayQueryGetIntersectionT ||
4074
glslangOp == glslang::EOpRayQueryGetIntersectionInstanceCustomIndex ||
4075
glslangOp == glslang::EOpRayQueryGetIntersectionInstanceId ||
4076
glslangOp == glslang::EOpRayQueryGetIntersectionInstanceShaderBindingTableRecordOffset ||
4077
glslangOp == glslang::EOpRayQueryGetIntersectionGeometryIndex ||
4078
glslangOp == glslang::EOpRayQueryGetIntersectionPrimitiveIndex ||
4079
glslangOp == glslang::EOpRayQueryGetIntersectionBarycentrics ||
4080
glslangOp == glslang::EOpRayQueryGetIntersectionFrontFace ||
4081
glslangOp == glslang::EOpRayQueryGetIntersectionObjectRayDirection ||
4082
glslangOp == glslang::EOpRayQueryGetIntersectionObjectRayOrigin ||
4083
glslangOp == glslang::EOpRayQueryGetIntersectionObjectToWorld ||
4084
glslangOp == glslang::EOpRayQueryGetIntersectionWorldToObject ||
4085
glslangOp == glslang::EOpRayQueryGetIntersectionTriangleVertexPositionsEXT ||
4086
glslangOp == glslang::EOpRayQueryGetIntersectionClusterIdNV ||
4087
glslangOp == glslang::EOpRayQueryGetIntersectionSpherePositionNV ||
4088
glslangOp == glslang::EOpRayQueryGetIntersectionSphereRadiusNV ||
4089
glslangOp == glslang::EOpRayQueryGetIntersectionLSSHitValueNV ||
4090
glslangOp == glslang::EOpRayQueryGetIntersectionLSSPositionsNV ||
4091
glslangOp == glslang::EOpRayQueryGetIntersectionLSSRadiiNV ||
4092
glslangOp == glslang::EOpRayQueryIsLSSHitNV ||
4093
glslangOp == glslang::EOpRayQueryIsSphereHitNV
4094
)) {
4095
bool cond = glslangOperands[arg]->getAsConstantUnion()->getConstArray()[0].getBConst();
4096
operands.push_back(builder.makeIntConstant(cond ? 1 : 0));
4097
} else if ((arg == 10 && glslangOp == glslang::EOpTraceKHR) ||
4098
(arg == 11 && glslangOp == glslang::EOpTraceRayMotionNV) ||
4099
(arg == 1 && glslangOp == glslang::EOpExecuteCallableKHR) ||
4100
(arg == 1 && glslangOp == glslang::EOpHitObjectExecuteShaderNV) ||
4101
(arg == 1 && glslangOp == glslang::EOpHitObjectExecuteShaderEXT) ||
4102
(arg == 11 && glslangOp == glslang::EOpHitObjectTraceRayNV) ||
4103
(arg == 11 && glslangOp == glslang::EOpHitObjectTraceRayEXT) ||
4104
(arg == 12 && glslangOp == glslang::EOpHitObjectTraceRayMotionNV) ||
4105
(arg == 12 && glslangOp == glslang::EOpHitObjectTraceRayMotionEXT) ||
4106
(arg == 12 && glslangOp == glslang::EOpHitObjectTraceMotionReorderExecuteEXT && glslangOperands.size() == 13) ||
4107
(arg == 14 && glslangOp == glslang::EOpHitObjectTraceMotionReorderExecuteEXT && glslangOperands.size() == 15) ||
4108
(arg == 11 && glslangOp == glslang::EOpHitObjectTraceReorderExecuteEXT && glslangOperands.size() == 12) ||
4109
(arg == 13 && glslangOp == glslang::EOpHitObjectTraceReorderExecuteEXT && glslangOperands.size() == 14) ||
4110
(arg == 1 && glslangOp == glslang::EOpHitObjectReorderExecuteEXT && glslangOperands.size() == 2) ||
4111
(arg == 3 && glslangOp == glslang::EOpHitObjectReorderExecuteEXT && glslangOperands.size() == 4)) {
4112
const int set = glslangOp == glslang::EOpExecuteCallableKHR ? 1 : 0;
4113
const int location = glslangOperands[arg]->getAsConstantUnion()->getConstArray()[0].getUConst();
4114
auto itNode = locationToSymbol[set].find(location);
4115
visitSymbol(itNode->second);
4116
spv::Id symId = getSymbolId(itNode->second);
4117
operands.push_back(symId);
4118
} else if ((arg == 12 && glslangOp == glslang::EOpHitObjectRecordHitNV) ||
4119
(arg == 13 && glslangOp == glslang::EOpHitObjectRecordHitMotionNV) ||
4120
(arg == 11 && glslangOp == glslang::EOpHitObjectRecordHitWithIndexNV) ||
4121
(arg == 12 && glslangOp == glslang::EOpHitObjectRecordHitWithIndexMotionNV) ||
4122
(arg == 3 && glslangOp == glslang::EOpHitObjectRecordFromQueryEXT) ||
4123
(arg == 1 && glslangOp == glslang::EOpHitObjectGetAttributesEXT) ||
4124
(arg == 1 && glslangOp == glslang::EOpHitObjectGetAttributesNV)) {
4125
const int location = glslangOperands[arg]->getAsConstantUnion()->getConstArray()[0].getUConst();
4126
const int set = 2;
4127
auto itNode = locationToSymbol[set].find(location);
4128
visitSymbol(itNode->second);
4129
spv::Id symId = getSymbolId(itNode->second);
4130
operands.push_back(symId);
4131
} else if (glslangOperands[arg]->getAsTyped()->getQualifier().isSpirvLiteral()) {
4132
// Will be translated to a literal value, make a placeholder here
4133
operands.push_back(spv::NoResult);
4134
} else if (glslangOperands[arg]->getAsTyped()->getBasicType() == glslang::EbtFunction) {
4135
spv::Function* function = functionMap[glslangOperands[arg]->getAsSymbolNode()->getMangledName().c_str()];
4136
assert(function);
4137
operands.push_back(function->getId());
4138
} else {
4139
operands.push_back(accessChainLoad(glslangOperands[arg]->getAsTyped()->getType()));
4140
}
4141
}
4142
}
4143
4144
builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
4145
if (node->getOp() == glslang::EOpCooperativeMatrixLoadTensorNV) {
4146
std::vector<spv::IdImmediate> idImmOps;
4147
4148
builder.addCapability(spv::Capability::CooperativeMatrixTensorAddressingNV);
4149
builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
4150
4151
spv::Id object = builder.createLoad(operands[0], spv::NoPrecision);
4152
4153
idImmOps.push_back(spv::IdImmediate(true, operands[1])); // Pointer
4154
idImmOps.push_back(spv::IdImmediate(true, object)); // Object
4155
idImmOps.push_back(spv::IdImmediate(true, operands[2])); // tensorLayout
4156
4157
idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end()); // memoryaccess
4158
4159
// initialize tensor operands to zero, then OR in flags based on the operands
4160
size_t tensorOpIdx = idImmOps.size();
4161
idImmOps.push_back(spv::IdImmediate(false, 0));
4162
4163
for (uint32_t i = 3; i < operands.size(); ++i) {
4164
if (builder.isTensorView(operands[i])) {
4165
addMask(idImmOps[tensorOpIdx].word, spv::TensorAddressingOperandsMask::TensorView);
4166
} else {
4167
// must be the decode func
4168
addMask(idImmOps[tensorOpIdx].word, spv::TensorAddressingOperandsMask::DecodeFunc);
4169
builder.addCapability(spv::Capability::CooperativeMatrixBlockLoadsNV);
4170
}
4171
idImmOps.push_back(spv::IdImmediate(true, operands[i])); // tensorView or decodeFunc
4172
}
4173
4174
// get the pointee type
4175
spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
4176
assert(builder.isCooperativeMatrixType(typeId));
4177
// do the op
4178
spv::Id result = builder.createOp(spv::Op::OpCooperativeMatrixLoadTensorNV, typeId, idImmOps);
4179
// store the result to the pointer (out param 'm')
4180
builder.createStore(result, operands[0]);
4181
result = 0;
4182
} else if (node->getOp() == glslang::EOpCooperativeMatrixLoad ||
4183
node->getOp() == glslang::EOpCooperativeMatrixLoadNV) {
4184
std::vector<spv::IdImmediate> idImmOps;
4185
4186
idImmOps.push_back(spv::IdImmediate(true, operands[1])); // buf
4187
if (node->getOp() == glslang::EOpCooperativeMatrixLoad) {
4188
idImmOps.push_back(spv::IdImmediate(true, operands[3])); // matrixLayout
4189
auto layout = (spv::CooperativeMatrixLayout)builder.getConstantScalar(operands[3]);
4190
if (layout == spv::CooperativeMatrixLayout::RowBlockedInterleavedARM ||
4191
layout == spv::CooperativeMatrixLayout::ColumnBlockedInterleavedARM) {
4192
builder.addExtension(spv::E_SPV_ARM_cooperative_matrix_layouts);
4193
builder.addCapability(spv::Capability::CooperativeMatrixLayoutsARM);
4194
}
4195
idImmOps.push_back(spv::IdImmediate(true, operands[2])); // stride
4196
} else {
4197
idImmOps.push_back(spv::IdImmediate(true, operands[2])); // stride
4198
idImmOps.push_back(spv::IdImmediate(true, operands[3])); // colMajor
4199
}
4200
idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end());
4201
// get the pointee type
4202
spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
4203
assert(builder.isCooperativeMatrixType(typeId));
4204
// do the op
4205
spv::Id result = node->getOp() == glslang::EOpCooperativeMatrixLoad
4206
? builder.createOp(spv::Op::OpCooperativeMatrixLoadKHR, typeId, idImmOps)
4207
: builder.createOp(spv::Op::OpCooperativeMatrixLoadNV, typeId, idImmOps);
4208
// store the result to the pointer (out param 'm')
4209
builder.createStore(result, operands[0]);
4210
result = 0;
4211
} else if (node->getOp() == glslang::EOpCooperativeMatrixStoreTensorNV) {
4212
std::vector<spv::IdImmediate> idImmOps;
4213
4214
idImmOps.push_back(spv::IdImmediate(true, operands[1])); // buf
4215
idImmOps.push_back(spv::IdImmediate(true, operands[0])); // object
4216
4217
builder.addCapability(spv::Capability::CooperativeMatrixTensorAddressingNV);
4218
builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
4219
4220
idImmOps.push_back(spv::IdImmediate(true, operands[2])); // tensorLayout
4221
4222
idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end()); // memoryaccess
4223
4224
if (operands.size() > 3) {
4225
idImmOps.push_back(spv::IdImmediate(false, spv::TensorAddressingOperandsMask::TensorView));
4226
idImmOps.push_back(spv::IdImmediate(true, operands[3])); // tensorView
4227
} else {
4228
idImmOps.push_back(spv::IdImmediate(false, 0));
4229
}
4230
4231
builder.createNoResultOp(spv::Op::OpCooperativeMatrixStoreTensorNV, idImmOps);
4232
result = 0;
4233
} else if (node->getOp() == glslang::EOpCooperativeMatrixStore ||
4234
node->getOp() == glslang::EOpCooperativeMatrixStoreNV) {
4235
std::vector<spv::IdImmediate> idImmOps;
4236
4237
idImmOps.push_back(spv::IdImmediate(true, operands[1])); // buf
4238
idImmOps.push_back(spv::IdImmediate(true, operands[0])); // object
4239
if (node->getOp() == glslang::EOpCooperativeMatrixStore) {
4240
idImmOps.push_back(spv::IdImmediate(true, operands[3])); // matrixLayout
4241
auto layout = (spv::CooperativeMatrixLayout)builder.getConstantScalar(operands[3]);
4242
if (layout == spv::CooperativeMatrixLayout::RowBlockedInterleavedARM ||
4243
layout == spv::CooperativeMatrixLayout::ColumnBlockedInterleavedARM) {
4244
builder.addExtension(spv::E_SPV_ARM_cooperative_matrix_layouts);
4245
builder.addCapability(spv::Capability::CooperativeMatrixLayoutsARM);
4246
}
4247
idImmOps.push_back(spv::IdImmediate(true, operands[2])); // stride
4248
} else {
4249
idImmOps.push_back(spv::IdImmediate(true, operands[2])); // stride
4250
idImmOps.push_back(spv::IdImmediate(true, operands[3])); // colMajor
4251
}
4252
idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end());
4253
4254
if (node->getOp() == glslang::EOpCooperativeMatrixStore)
4255
builder.createNoResultOp(spv::Op::OpCooperativeMatrixStoreKHR, idImmOps);
4256
else
4257
builder.createNoResultOp(spv::Op::OpCooperativeMatrixStoreNV, idImmOps);
4258
result = 0;
4259
} else if (node->getOp() == glslang::EOpRayQueryGetIntersectionTriangleVertexPositionsEXT) {
4260
std::vector<spv::IdImmediate> idImmOps;
4261
4262
idImmOps.push_back(spv::IdImmediate(true, operands[0])); // q
4263
idImmOps.push_back(spv::IdImmediate(true, operands[1])); // committed
4264
4265
spv::Id typeId = builder.makeArrayType(builder.makeVectorType(builder.makeFloatType(32), 3),
4266
builder.makeUintConstant(3), 0);
4267
// do the op
4268
4269
spv::Op spvOp = spv::Op::OpRayQueryGetIntersectionTriangleVertexPositionsKHR;
4270
4271
spv::Id result = builder.createOp(spvOp, typeId, idImmOps);
4272
// store the result to the pointer (out param 'm')
4273
builder.createStore(result, operands[2]);
4274
result = 0;
4275
} else if (node->getOp() == glslang::EOpRayQueryGetIntersectionLSSPositionsNV) {
4276
std::vector<spv::IdImmediate> idImmOps;
4277
4278
idImmOps.push_back(spv::IdImmediate(true, operands[0])); // q
4279
idImmOps.push_back(spv::IdImmediate(true, operands[1])); // committed
4280
4281
spv::Id typeId = builder.makeArrayType(builder.makeVectorType(builder.makeFloatType(32), 3),
4282
builder.makeUintConstant(2), 0);
4283
// do the op
4284
4285
spv::Op spvOp = spv::Op::OpRayQueryGetIntersectionLSSPositionsNV;
4286
4287
spv::Id result = builder.createOp(spvOp, typeId, idImmOps);
4288
// store the result to the pointer (out param 'm')
4289
builder.createStore(result, operands[2]);
4290
result = 0;
4291
} else if (node->getOp() == glslang::EOpRayQueryGetIntersectionLSSRadiiNV) {
4292
std::vector<spv::IdImmediate> idImmOps;
4293
4294
idImmOps.push_back(spv::IdImmediate(true, operands[0])); // q
4295
idImmOps.push_back(spv::IdImmediate(true, operands[1])); // committed
4296
4297
spv::Id typeId = builder.makeArrayType(builder.makeFloatType(32),
4298
builder.makeUintConstant(2), 0);
4299
// do the op
4300
4301
spv::Op spvOp = spv::Op::OpRayQueryGetIntersectionLSSRadiiNV;
4302
4303
spv::Id result = builder.createOp(spvOp, typeId, idImmOps);
4304
// store the result to the pointer (out param 'm')
4305
builder.createStore(result, operands[2]);
4306
result = 0;
4307
} else if (node->getOp() == glslang::EOpHitObjectGetLSSPositionsNV) {
4308
std::vector<spv::IdImmediate> idImmOps;
4309
4310
idImmOps.push_back(spv::IdImmediate(true, operands[0])); // hitObject
4311
4312
spv::Op spvOp = spv::Op::OpHitObjectGetLSSPositionsNV;
4313
spv::Id typeId = builder.makeArrayType(builder.makeVectorType(builder.makeFloatType(32), 3),
4314
builder.makeUintConstant(2), 0);
4315
4316
spv::Id result = builder.createOp(spvOp, typeId, idImmOps);
4317
// store the result to the pointer (out param 'm')
4318
builder.createStore(result, operands[1]);
4319
result = 0;
4320
} else if (node->getOp() == glslang::EOpHitObjectGetLSSRadiiNV) {
4321
std::vector<spv::IdImmediate> idImmOps;
4322
4323
idImmOps.push_back(spv::IdImmediate(true, operands[0])); // hitObject
4324
4325
spv::Op spvOp = spv::Op::OpHitObjectGetLSSRadiiNV;
4326
spv::Id typeId = builder.makeArrayType(builder.makeFloatType(32),
4327
builder.makeUintConstant(2), 0);
4328
4329
spv::Id result = builder.createOp(spvOp, typeId, idImmOps);
4330
// store the result to the pointer (out param 'm')
4331
builder.createStore(result, operands[1]);
4332
result = 0;
4333
} else if (node->getOp() == glslang::EOpHitObjectGetIntersectionTriangleVertexPositionsEXT) {
4334
std::vector<spv::IdImmediate> idImmOps;
4335
4336
idImmOps.push_back(spv::IdImmediate(true, operands[0])); // hitObject
4337
4338
spv::Op spvOp = spv::Op::OpHitObjectGetIntersectionTriangleVertexPositionsEXT;
4339
spv::Id typeId = builder.makeArrayType(builder.makeVectorType(builder.makeFloatType(32), 3),
4340
builder.makeUintConstant(3), 0);
4341
4342
spv::Id result = builder.createOp(spvOp, typeId, idImmOps);
4343
// store the result to the pointer (out param 'm')
4344
builder.createStore(result, operands[1]);
4345
result = 0;
4346
} else if (node->getOp() == glslang::EOpCooperativeMatrixMulAdd) {
4347
auto matrixOperands = spv::CooperativeMatrixOperandsMask::MaskNone;
4348
4349
// If the optional operand is present, initialize matrixOperands to that value.
4350
if (glslangOperands.size() == 4 && glslangOperands[3]->getAsConstantUnion()) {
4351
matrixOperands = (spv::CooperativeMatrixOperandsMask)glslangOperands[3]->getAsConstantUnion()->getConstArray()[0].getIConst();
4352
}
4353
4354
// Determine Cooperative Matrix Operands bits from the signedness of the types.
4355
if (isTypeSignedInt(glslangOperands[0]->getAsTyped()->getBasicType()))
4356
addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixASignedComponentsKHR);
4357
if (isTypeSignedInt(glslangOperands[1]->getAsTyped()->getBasicType()))
4358
addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixBSignedComponentsKHR);
4359
if (isTypeSignedInt(glslangOperands[2]->getAsTyped()->getBasicType()))
4360
addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixCSignedComponentsKHR);
4361
if (isTypeSignedInt(node->getBasicType()))
4362
addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixResultSignedComponentsKHR);
4363
4364
std::vector<spv::IdImmediate> idImmOps;
4365
idImmOps.push_back(spv::IdImmediate(true, operands[0]));
4366
idImmOps.push_back(spv::IdImmediate(true, operands[1]));
4367
idImmOps.push_back(spv::IdImmediate(true, operands[2]));
4368
if (matrixOperands != spv::CooperativeMatrixOperandsMask::MaskNone)
4369
idImmOps.push_back(spv::IdImmediate(false, matrixOperands));
4370
4371
result = builder.createOp(spv::Op::OpCooperativeMatrixMulAddKHR, resultType(), idImmOps);
4372
} else if (node->getOp() == glslang::EOpCooperativeMatrixReduceNV) {
4373
builder.addCapability(spv::Capability::CooperativeMatrixReductionsNV);
4374
builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
4375
4376
spv::Op opcode = spv::Op::OpCooperativeMatrixReduceNV;
4377
unsigned mask = glslangOperands[2]->getAsConstantUnion()->getConstArray()[0].getUConst();
4378
4379
spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
4380
assert(builder.isCooperativeMatrixType(typeId));
4381
4382
result = builder.createCooperativeMatrixReduce(opcode, typeId, operands[1], mask, operands[3]);
4383
// store the result to the pointer (out param 'm')
4384
builder.createStore(result, operands[0]);
4385
result = 0;
4386
} else if (node->getOp() == glslang::EOpCooperativeMatrixPerElementOpNV) {
4387
builder.addCapability(spv::Capability::CooperativeMatrixPerElementOperationsNV);
4388
builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
4389
4390
spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
4391
assert(builder.isCooperativeMatrixType(typeId));
4392
4393
result = builder.createCooperativeMatrixPerElementOp(typeId, operands);
4394
// store the result to the pointer
4395
builder.createStore(result, operands[0]);
4396
result = 0;
4397
} else if (node->getOp() == glslang::EOpCooperativeMatrixTransposeNV) {
4398
4399
builder.addCapability(spv::Capability::CooperativeMatrixConversionsNV);
4400
builder.addExtension(spv::E_SPV_NV_cooperative_matrix2);
4401
4402
spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
4403
assert(builder.isCooperativeMatrixType(typeId));
4404
4405
result = builder.createUnaryOp(spv::Op::OpCooperativeMatrixTransposeNV, typeId, operands[1]);
4406
// store the result to the pointer
4407
builder.createStore(result, operands[0]);
4408
result = 0;
4409
} else if (node->getOp() == glslang::EOpBitCastArrayQCOM) {
4410
builder.addCapability(spv::Capability::CooperativeMatrixConversionQCOM);
4411
builder.addExtension(spv::E_SPV_QCOM_cooperative_matrix_conversion);
4412
result = builder.createUnaryOp(spv::Op::OpBitCastArrayQCOM, resultType(), operands[0]);
4413
} else if (node->getOp() == glslang::EOpCompositeConstructCoopMatQCOM) {
4414
builder.addCapability(spv::Capability::CooperativeMatrixConversionQCOM);
4415
builder.addExtension(spv::E_SPV_QCOM_cooperative_matrix_conversion);
4416
result = builder.createUnaryOp(spv::Op::OpCompositeConstructCoopMatQCOM, resultType(), operands[0]);
4417
} else if (node->getOp() == glslang::EOpCompositeExtractCoopMatQCOM) {
4418
builder.addCapability(spv::Capability::CooperativeMatrixConversionQCOM);
4419
builder.addExtension(spv::E_SPV_QCOM_cooperative_matrix_conversion);
4420
result = builder.createUnaryOp(spv::Op::OpCompositeExtractCoopMatQCOM, resultType(), operands[0]);
4421
} else if (node->getOp() == glslang::EOpExtractSubArrayQCOM) {
4422
builder.addCapability(spv::Capability::CooperativeMatrixConversionQCOM);
4423
builder.addExtension(spv::E_SPV_QCOM_cooperative_matrix_conversion);
4424
4425
std::vector<spv::Id> arguments { operands[0], operands[1] };;
4426
result = builder.createOp(spv::Op::OpExtractSubArrayQCOM, resultType(), arguments);
4427
} else if (node->getOp() == glslang::EOpCooperativeVectorMatMulNV ||
4428
node->getOp() == glslang::EOpCooperativeVectorMatMulAddNV) {
4429
auto matrixOperands = spv::CooperativeMatrixOperandsMask::MaskNone;
4430
4431
bool isMulAdd = node->getOp() == glslang::EOpCooperativeVectorMatMulAddNV;
4432
4433
// Determine Cooperative Matrix Operands bits from the signedness of the types.
4434
4435
if (isTypeSignedInt(glslangOperands[1]->getAsTyped()->getBasicType()))
4436
addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixBSignedComponentsKHR);
4437
if (isTypeSignedInt(glslangOperands[0]->getAsTyped()->getBasicType()))
4438
addMask(matrixOperands, spv::CooperativeMatrixOperandsMask::MatrixResultSignedComponentsKHR);
4439
4440
uint32_t opIdx = 1;
4441
std::vector<spv::IdImmediate> idImmOps;
4442
idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // Input
4443
idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // InputInterpretation
4444
idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // Matrix
4445
idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // MatrixOffset
4446
idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // MatrixInterpretation
4447
if (isMulAdd) {
4448
idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // Bias
4449
idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // BiasOffset
4450
idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // BiasInterpretation
4451
}
4452
idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // M
4453
idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // K
4454
idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // MemoryLayout
4455
idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // Transpose
4456
idImmOps.push_back(spv::IdImmediate(true, operands[opIdx++])); // MatrixStride
4457
if (matrixOperands != spv::CooperativeMatrixOperandsMask::MaskNone)
4458
idImmOps.push_back(spv::IdImmediate(false, matrixOperands)); // Cooperative Matrix Operands
4459
4460
// get the pointee type
4461
spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
4462
assert(builder.isCooperativeVectorType(typeId));
4463
// do the op
4464
spv::Id result = builder.createOp(isMulAdd ? spv::Op::OpCooperativeVectorMatrixMulAddNV : spv::Op::OpCooperativeVectorMatrixMulNV, typeId, idImmOps);
4465
// store the result to the pointer (out param 'res')
4466
builder.createStore(result, operands[0]);
4467
result = 0;
4468
} else if (node->getOp() == glslang::EOpCooperativeVectorLoadNV) {
4469
std::vector<spv::IdImmediate> idImmOps;
4470
4471
idImmOps.push_back(spv::IdImmediate(true, operands[1])); // buf
4472
idImmOps.push_back(spv::IdImmediate(true, operands[2])); // offset
4473
idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end());
4474
// get the pointee type
4475
spv::Id typeId = builder.getContainedTypeId(builder.getTypeId(operands[0]));
4476
assert(builder.isCooperativeVectorType(typeId));
4477
// do the op
4478
spv::Id result = builder.createOp(spv::Op::OpCooperativeVectorLoadNV, typeId, idImmOps);
4479
// store the result to the pointer (out param 'v')
4480
builder.createStore(result, operands[0]);
4481
result = 0;
4482
} else if (node->getOp() == glslang::EOpCooperativeVectorStoreNV) {
4483
std::vector<spv::IdImmediate> idImmOps;
4484
4485
idImmOps.push_back(spv::IdImmediate(true, operands[1])); // buf
4486
idImmOps.push_back(spv::IdImmediate(true, operands[2])); // offset
4487
idImmOps.push_back(spv::IdImmediate(true, operands[0])); // object
4488
idImmOps.insert(idImmOps.end(), memoryAccessOperands.begin(), memoryAccessOperands.end());
4489
builder.createNoResultOp(spv::Op::OpCooperativeVectorStoreNV, idImmOps);
4490
result = 0;
4491
} else if (node->getOp() == glslang::EOpCooperativeVectorOuterProductAccumulateNV) {
4492
builder.addCapability(spv::Capability::CooperativeVectorTrainingNV);
4493
builder.addExtension(spv::E_SPV_NV_cooperative_vector);
4494
4495
std::vector<spv::IdImmediate> idImmOps;
4496
4497
idImmOps.push_back(spv::IdImmediate(true, operands[2])); // Matrix
4498
idImmOps.push_back(spv::IdImmediate(true, operands[3])); // Offset
4499
idImmOps.push_back(spv::IdImmediate(true, operands[0])); // A
4500
idImmOps.push_back(spv::IdImmediate(true, operands[1])); // B
4501
idImmOps.push_back(spv::IdImmediate(true, operands[5])); // MemoryLayout
4502
idImmOps.push_back(spv::IdImmediate(true, operands[6])); // MatrixInterpretation
4503
idImmOps.push_back(spv::IdImmediate(true, operands[4])); // Stride
4504
builder.createNoResultOp(spv::Op::OpCooperativeVectorOuterProductAccumulateNV, idImmOps);
4505
result = 0;
4506
} else if (node->getOp() == glslang::EOpCooperativeVectorReduceSumAccumulateNV) {
4507
builder.addCapability(spv::Capability::CooperativeVectorTrainingNV);
4508
builder.addExtension(spv::E_SPV_NV_cooperative_vector);
4509
4510
std::vector<spv::IdImmediate> idImmOps;
4511
4512
idImmOps.push_back(spv::IdImmediate(true, operands[1])); // Buf
4513
idImmOps.push_back(spv::IdImmediate(true, operands[2])); // Offset
4514
idImmOps.push_back(spv::IdImmediate(true, operands[0])); // A
4515
builder.createNoResultOp(spv::Op::OpCooperativeVectorReduceSumAccumulateNV, idImmOps);
4516
result = 0;
4517
} else if (node->getOp() == glslang::EOpTensorReadARM ||
4518
node->getOp() == glslang::EOpTensorWriteARM) {
4519
const bool isWrite = node->getOp() == glslang::EOpTensorWriteARM;
4520
const unsigned int tensorMinOperandCount = 3;
4521
assert(operands.size() >= tensorMinOperandCount);
4522
std::vector<spv::IdImmediate> idImmOps;
4523
4524
idImmOps.push_back(spv::IdImmediate(true, operands[0])); // tensor
4525
idImmOps.push_back(spv::IdImmediate(true, operands[1])); // coords
4526
if (isWrite) {
4527
idImmOps.push_back(spv::IdImmediate(true, operands[2])); // value
4528
}
4529
4530
// Analyze the tensor operands
4531
spv::IdImmediate tensorOperands = { false, uint32_t(spv::TensorOperandsMask::MaskNone) };
4532
bool pushExtraArg = false;
4533
if (operands.size() > tensorMinOperandCount) {
4534
auto enumVal = builder.getConstantScalar(operands[tensorMinOperandCount]);
4535
4536
if (enumVal & uint32_t(spv::TensorOperandsMask::NontemporalARM)) {
4537
tensorOperands.word |= uint32_t(spv::TensorOperandsMask::NontemporalARM);
4538
}
4539
if (enumVal & uint32_t(spv::TensorOperandsMask::OutOfBoundsValueARM)) {
4540
tensorOperands.word |= uint32_t(spv::TensorOperandsMask::OutOfBoundsValueARM);
4541
assert(operands.size() >= tensorMinOperandCount + 2 &&
4542
"TensorOperandsOutOfBoundsValueMask requires an additional value");
4543
pushExtraArg = true;
4544
}
4545
}
4546
4547
// Append optional tensor operands if the mask was non-zero.
4548
if (tensorOperands.word) {
4549
idImmOps.push_back(tensorOperands);
4550
if (pushExtraArg)
4551
idImmOps.push_back(spv::IdImmediate(true, operands[tensorMinOperandCount + 1]));
4552
}
4553
4554
if (isWrite) {
4555
builder.createNoResultOp(spv::Op::OpTensorWriteARM, idImmOps);
4556
result = 0;
4557
} else {
4558
// Use the result argument type as the OpTensorReadARM result type.
4559
const glslang::TType &resArgType = glslangOperands[2]->getAsTyped()->getType();
4560
spv::Id retType = convertGlslangToSpvType(resArgType);
4561
result = builder.createOp(spv::Op::OpTensorReadARM, retType, idImmOps);
4562
// Store the result to the result argument.
4563
builder.createStore(result, operands[2]);
4564
}
4565
} else if (node->getOp() == glslang::EOpTensorSizeARM) {
4566
// Expected operands are (tensor, dimension)
4567
assert(operands.size() == 2);
4568
4569
spv::Id tensorOp = operands[0];
4570
spv::Id dimOp = operands[1];
4571
assert(builder.isTensorTypeARM(builder.getTypeId(tensorOp)) && "operand #0 must be a tensor");
4572
4573
std::vector<spv::IdImmediate> idImmOps;
4574
idImmOps.push_back(spv::IdImmediate(true, tensorOp));
4575
idImmOps.push_back(spv::IdImmediate(true, dimOp));
4576
result = builder.createOp(spv::Op::OpTensorQuerySizeARM, resultType(), idImmOps);
4577
} else if (atomic) {
4578
// Handle all atomics
4579
glslang::TBasicType typeProxy = (node->getOp() == glslang::EOpAtomicStore)
4580
? node->getSequence()[0]->getAsTyped()->getBasicType() : node->getBasicType();
4581
result = createAtomicOperation(node->getOp(), precision, resultType(), operands, typeProxy,
4582
lvalueCoherentFlags, node->getType());
4583
} else if (node->getOp() == glslang::EOpSpirvInst) {
4584
const auto& spirvInst = node->getSpirvInstruction();
4585
if (spirvInst.set == "") {
4586
std::vector<spv::IdImmediate> idImmOps;
4587
for (unsigned int i = 0; i < glslangOperands.size(); ++i) {
4588
if (glslangOperands[i]->getAsTyped()->getQualifier().isSpirvLiteral()) {
4589
// Translate the constant to a literal value
4590
std::vector<unsigned> literals;
4591
glslang::TVector<const glslang::TIntermConstantUnion*> constants;
4592
constants.push_back(glslangOperands[i]->getAsConstantUnion());
4593
TranslateLiterals(constants, literals);
4594
idImmOps.push_back({false, literals[0]});
4595
} else
4596
idImmOps.push_back({true, operands[i]});
4597
}
4598
4599
if (node->getBasicType() == glslang::EbtVoid)
4600
builder.createNoResultOp(static_cast<spv::Op>(spirvInst.id), idImmOps);
4601
else
4602
result = builder.createOp(static_cast<spv::Op>(spirvInst.id), resultType(), idImmOps);
4603
} else {
4604
result = builder.createBuiltinCall(
4605
resultType(), spirvInst.set == "GLSL.std.450" ? stdBuiltins : getExtBuiltins(spirvInst.set.c_str()),
4606
spirvInst.id, operands);
4607
}
4608
noReturnValue = node->getBasicType() == glslang::EbtVoid;
4609
} else if (node->getOp() == glslang::EOpDebugPrintf) {
4610
if (!nonSemanticDebugPrintf) {
4611
nonSemanticDebugPrintf = builder.import("NonSemantic.DebugPrintf");
4612
}
4613
result = builder.createBuiltinCall(builder.makeVoidType(), nonSemanticDebugPrintf, spv::NonSemanticDebugPrintfDebugPrintf, operands);
4614
builder.addExtension(spv::E_SPV_KHR_non_semantic_info);
4615
} else {
4616
// Pass through to generic operations.
4617
switch (glslangOperands.size()) {
4618
case 0:
4619
result = createNoArgOperation(node->getOp(), precision, resultType());
4620
break;
4621
case 1:
4622
{
4623
OpDecorations decorations = { precision,
4624
TranslateNoContractionDecoration(node->getType().getQualifier()),
4625
TranslateNonUniformDecoration(node->getType().getQualifier()) };
4626
result = createUnaryOperation(
4627
node->getOp(), decorations,
4628
resultType(), operands.front(),
4629
glslangOperands[0]->getAsTyped()->getBasicType(), lvalueCoherentFlags, node->getType());
4630
}
4631
break;
4632
default:
4633
result = createMiscOperation(node->getOp(), precision, resultType(), operands, node->getBasicType());
4634
break;
4635
}
4636
4637
if (invertedType != spv::NoResult)
4638
result = createInvertedSwizzle(precision, *glslangOperands[0]->getAsBinaryNode(), result);
4639
4640
for (unsigned int i = 0; i < temporaryLvalues.size(); ++i) {
4641
builder.setAccessChain(complexLvalues[i]);
4642
builder.accessChainStore(builder.createLoad(temporaryLvalues[i], spv::NoPrecision),
4643
TranslateNonUniformDecoration(complexLvalues[i].coherentFlags));
4644
}
4645
}
4646
4647
if (noReturnValue)
4648
return false;
4649
4650
if (! result) {
4651
logger->missingFunctionality("unknown glslang aggregate");
4652
return true; // pick up a child as a placeholder operand
4653
} else {
4654
builder.clearAccessChain();
4655
builder.setAccessChainRValue(result);
4656
return false;
4657
}
4658
}
4659
4660
// This path handles both if-then-else and ?:
4661
// The if-then-else has a node type of void, while
4662
// ?: has either a void or a non-void node type
4663
//
4664
// Leaving the result, when not void:
4665
// GLSL only has r-values as the result of a :?, but
4666
// if we have an l-value, that can be more efficient if it will
4667
// become the base of a complex r-value expression, because the
4668
// next layer copies r-values into memory to use the access-chain mechanism
4669
bool TGlslangToSpvTraverser::visitSelection(glslang::TVisit /* visit */, glslang::TIntermSelection* node)
4670
{
4671
// see if OpSelect can handle it
4672
const auto isOpSelectable = [&]() {
4673
if (node->getBasicType() == glslang::EbtVoid)
4674
return false;
4675
// OpSelect can do all other types starting with SPV 1.4
4676
if (glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_4) {
4677
// pre-1.4, only scalars and vectors can be handled
4678
if ((!node->getType().isScalar() && !node->getType().isVector()))
4679
return false;
4680
}
4681
return true;
4682
};
4683
4684
// See if it simple and safe, or required, to execute both sides.
4685
// Crucially, side effects must be either semantically required or avoided,
4686
// and there are performance trade-offs.
4687
// Return true if required or a good idea (and safe) to execute both sides,
4688
// false otherwise.
4689
const auto bothSidesPolicy = [&]() -> bool {
4690
// do we have both sides?
4691
if (node->getTrueBlock() == nullptr ||
4692
node->getFalseBlock() == nullptr)
4693
return false;
4694
4695
// required? (unless we write additional code to look for side effects
4696
// and make performance trade-offs if none are present)
4697
if (!node->getShortCircuit())
4698
return true;
4699
4700
// if not required to execute both, decide based on performance/practicality...
4701
4702
if (!isOpSelectable())
4703
return false;
4704
4705
assert(node->getType() == node->getTrueBlock() ->getAsTyped()->getType() &&
4706
node->getType() == node->getFalseBlock()->getAsTyped()->getType());
4707
4708
// return true if a single operand to ? : is okay for OpSelect
4709
const auto operandOkay = [](glslang::TIntermTyped* node) {
4710
return node->getAsSymbolNode() || node->getType().getQualifier().isConstant();
4711
};
4712
4713
return operandOkay(node->getTrueBlock() ->getAsTyped()) &&
4714
operandOkay(node->getFalseBlock()->getAsTyped());
4715
};
4716
4717
spv::Id result = spv::NoResult; // upcoming result selecting between trueValue and falseValue
4718
// emit the condition before doing anything with selection
4719
node->getCondition()->traverse(this);
4720
spv::Id condition = accessChainLoad(node->getCondition()->getType());
4721
4722
// Find a way of executing both sides and selecting the right result.
4723
const auto executeBothSides = [&]() -> void {
4724
// execute both sides
4725
spv::Id resultType = convertGlslangToSpvType(node->getType());
4726
node->getTrueBlock()->traverse(this);
4727
spv::Id trueValue = accessChainLoad(node->getTrueBlock()->getAsTyped()->getType());
4728
node->getFalseBlock()->traverse(this);
4729
spv::Id falseValue = accessChainLoad(node->getFalseBlock()->getAsTyped()->getType());
4730
4731
builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
4732
4733
// done if void
4734
if (node->getBasicType() == glslang::EbtVoid)
4735
return;
4736
4737
// emit code to select between trueValue and falseValue
4738
// see if OpSelect can handle the result type, and that the SPIR-V types
4739
// of the inputs match the result type.
4740
if (isOpSelectable()) {
4741
// Emit OpSelect for this selection.
4742
4743
// smear condition to vector, if necessary (AST is always scalar)
4744
// Before 1.4, smear like for mix(), starting with 1.4, keep it scalar
4745
if (glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_4 && builder.isVector(trueValue)) {
4746
condition = builder.smearScalar(spv::NoPrecision, condition,
4747
builder.makeVectorType(builder.makeBoolType(),
4748
builder.getNumComponents(trueValue)));
4749
}
4750
4751
// If the types do not match, it is because of mismatched decorations on aggregates.
4752
// Since isOpSelectable only lets us get here for SPIR-V >= 1.4, we can use OpCopyObject
4753
// to get matching types.
4754
if (builder.getTypeId(trueValue) != resultType) {
4755
trueValue = builder.createUnaryOp(spv::Op::OpCopyLogical, resultType, trueValue);
4756
}
4757
if (builder.getTypeId(falseValue) != resultType) {
4758
falseValue = builder.createUnaryOp(spv::Op::OpCopyLogical, resultType, falseValue);
4759
}
4760
4761
// OpSelect
4762
result = builder.createTriOp(spv::Op::OpSelect, resultType, condition, trueValue, falseValue);
4763
4764
builder.clearAccessChain();
4765
builder.setAccessChainRValue(result);
4766
} else {
4767
// We need control flow to select the result.
4768
// TODO: Once SPIR-V OpSelect allows arbitrary types, eliminate this path.
4769
result = builder.createVariable(TranslatePrecisionDecoration(node->getType()),
4770
spv::StorageClass::Function, resultType);
4771
4772
// Selection control:
4773
const spv::SelectionControlMask control = TranslateSelectionControl(*node);
4774
4775
// make an "if" based on the value created by the condition
4776
spv::Builder::If ifBuilder(condition, control, builder);
4777
4778
// emit the "then" statement
4779
builder.clearAccessChain();
4780
builder.setAccessChainLValue(result);
4781
multiTypeStore(node->getType(), trueValue);
4782
4783
ifBuilder.makeBeginElse();
4784
// emit the "else" statement
4785
builder.clearAccessChain();
4786
builder.setAccessChainLValue(result);
4787
multiTypeStore(node->getType(), falseValue);
4788
4789
// finish off the control flow
4790
ifBuilder.makeEndIf();
4791
4792
builder.clearAccessChain();
4793
builder.setAccessChainLValue(result);
4794
}
4795
};
4796
4797
// Execute the one side needed, as per the condition
4798
const auto executeOneSide = [&]() {
4799
// Always emit control flow.
4800
if (node->getBasicType() != glslang::EbtVoid) {
4801
result = builder.createVariable(TranslatePrecisionDecoration(node->getType()), spv::StorageClass::Function,
4802
convertGlslangToSpvType(node->getType()));
4803
}
4804
4805
// Selection control:
4806
const spv::SelectionControlMask control = TranslateSelectionControl(*node);
4807
4808
// make an "if" based on the value created by the condition
4809
spv::Builder::If ifBuilder(condition, control, builder);
4810
4811
// emit the "then" statement
4812
if (node->getTrueBlock() != nullptr) {
4813
node->getTrueBlock()->traverse(this);
4814
if (result != spv::NoResult) {
4815
spv::Id load = accessChainLoad(node->getTrueBlock()->getAsTyped()->getType());
4816
4817
builder.clearAccessChain();
4818
builder.setAccessChainLValue(result);
4819
multiTypeStore(node->getType(), load);
4820
}
4821
}
4822
4823
if (node->getFalseBlock() != nullptr) {
4824
ifBuilder.makeBeginElse();
4825
// emit the "else" statement
4826
node->getFalseBlock()->traverse(this);
4827
if (result != spv::NoResult) {
4828
spv::Id load = accessChainLoad(node->getFalseBlock()->getAsTyped()->getType());
4829
4830
builder.clearAccessChain();
4831
builder.setAccessChainLValue(result);
4832
multiTypeStore(node->getType(), load);
4833
}
4834
}
4835
4836
// finish off the control flow
4837
ifBuilder.makeEndIf();
4838
4839
if (result != spv::NoResult) {
4840
builder.clearAccessChain();
4841
builder.setAccessChainLValue(result);
4842
}
4843
};
4844
4845
// Try for OpSelect (or a requirement to execute both sides)
4846
if (bothSidesPolicy()) {
4847
SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
4848
if (node->getType().getQualifier().isSpecConstant())
4849
spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
4850
executeBothSides();
4851
} else
4852
executeOneSide();
4853
4854
return false;
4855
}
4856
4857
// Translates a switch statement.
// The selector is emitted first, the switch body is then partitioned into
// code segments with their case/default labels, and finally each segment is
// emitted into the blocks allocated by the builder.
// The body is traversed explicitly here; the function always returns false.
bool TGlslangToSpvTraverser::visitSwitch(glslang::TVisit /* visit */, glslang::TIntermSwitch* node)
{
    // Emit and fetch the selector before doing anything else with the switch.
    node->getCondition()->traverse(this);
    spv::Id selector = accessChainLoad(node->getCondition()->getAsTyped()->getType());

    // Selection control:
    const spv::SelectionControlMask control = TranslateSwitchControl(*node);

    // Walk the children to sort out the code segments.
    glslang::TIntermSequence& sequence = node->getBody()->getSequence();
    std::vector<TIntermNode*> codeSegments;
    std::vector<int> caseValues;
    // One slot per child: an overestimate, probably not all slots are used.
    std::vector<int> valueIndexToSegment(sequence.size());
    int defaultSegment = -1;

    for (TIntermNode* child : sequence) {
        auto* const branch = child->getAsBranchNode();
        const bool isDefaultLabel = branch && branch->getFlowOp() == glslang::EOpDefault;
        const bool isCaseLabel = branch && branch->getFlowOp() == glslang::EOpCase;

        if (isDefaultLabel) {
            // The default label refers to the next segment to be collected.
            defaultSegment = static_cast<int>(codeSegments.size());
        } else if (isCaseLabel) {
            // Likewise for a case label; its constant value is recorded too.
            valueIndexToSegment[caseValues.size()] = static_cast<int>(codeSegments.size());
            caseValues.push_back(branch->getExpression()->getAsConstantUnion()->getConstArray()[0].getIConst());
        } else {
            codeSegments.push_back(child);
        }
    }

    // Handle the case where the last code segment is missing, due to no code
    // statements between the last label and the end of the switch statement.
    const int collectedSegments = static_cast<int>(codeSegments.size());
    const bool lastCaseHasNoCode =
        !caseValues.empty() && collectedSegments == valueIndexToSegment[caseValues.size() - 1];
    const bool defaultHasNoCode = collectedSegments == defaultSegment;
    if (lastCaseHasNoCode || defaultHasNoCode)
        codeSegments.push_back(nullptr);

    // Make the switch statement; segmentBlocks receives the blocks allocated in the call.
    std::vector<spv::Block*> segmentBlocks;
    builder.makeSwitch(selector, control, static_cast<int>(codeSegments.size()), caseValues, valueIndexToSegment,
                       defaultSegment, segmentBlocks);

    // Emit all the code in the segments. While inside the switch, the top of
    // breakForLoop is false.
    breakForLoop.push(false);
    for (unsigned int segment = 0; segment < codeSegments.size(); ++segment) {
        builder.nextSwitchSegment(segmentBlocks, segment);
        if (codeSegments[segment] != nullptr)
            codeSegments[segment]->traverse(this);
        else
            builder.addSwitchBreak(true); // placeholder segment: just break
    }
    breakForLoop.pop();

    builder.endSwitch(segmentBlocks);

    return false;
}
4910
4911
// Translates a constant-union node into a SPIR-V constant and leaves it in the
// access chain as an r-value. Nodes qualified as SPIR-V literals are skipped.
void TGlslangToSpvTraverser::visitConstantUnion(glslang::TIntermConstantUnion* node)
{
    // Everything except SPIR-V literals is processed; a literal is
    // translated to a literal value, so no constant is created for it.
    if (!node->getQualifier().isSpirvLiteral()) {
        // Index into the constant array, starting at the first element.
        int constIndex = 0;
        const spv::Id constantId =
            createSpvConstantFromConstUnionArray(node->getType(), node->getConstArray(), constIndex, false);

        builder.clearAccessChain();
        builder.setAccessChainRValue(constantId);
    }
}
4922
4923
// Translates a loop node.
// Emits a dedicated header block holding the loop merge, then either a
// test-first loop (test, body, terminal) or a test-last loop (body, terminal,
// test), and finally continues building in the merge block.
// All children are traversed explicitly here; the function always returns false.
bool TGlslangToSpvTraverser::visitLoop(glslang::TVisit /* visit */, glslang::TIntermLoop* node)
{
    auto loopBlocks = builder.makeNewLoop();
    builder.createBranch(true, &loopBlocks.head);

    // Loop control:
    std::vector<unsigned int> controlOperands;
    const spv::LoopControlMask control = TranslateLoopControl(*node, controlOperands);

    // Spec requires back edges to target header blocks, and every header block
    // must dominate its merge block. Make a header block first to ensure these
    // conditions are met. By definition, it will contain OpLoopMerge, followed
    // by a block-ending branch. But we don't want to put any other body/test
    // instructions in it, since the body/test may have arbitrary instructions,
    // including merges of its own.
    builder.setBuildPoint(&loopBlocks.head);
    builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
    builder.createLoopMerge(&loopBlocks.merge, &loopBlocks.continue_target, control, controlOperands);

    // Emit the loop test and load its value.
    const auto emitTest = [&]() -> spv::Id {
        node->getTest()->traverse(this);
        return accessChainLoad(node->getTestExpr()->getType());
    };

    // Emit the body block (ending with a branch to the continue target) and
    // then the terminal expression inside the continue target. The build point
    // is left in the continue target, which still needs its terminating branch.
    const auto emitBodyAndTerminal = [&]() {
        builder.setBuildPoint(&loopBlocks.body);
        breakForLoop.push(true); // while inside the loop body, the top of breakForLoop is true
        if (node->getBody())
            node->getBody()->traverse(this);
        builder.createBranch(true, &loopBlocks.continue_target);
        breakForLoop.pop();

        builder.setBuildPoint(&loopBlocks.continue_target);
        if (node->getTerminal())
            node->getTerminal()->traverse(this);
    };

    const bool testAtTop = node->testFirst() && node->getTest();
    if (testAtTop) {
        // header -> test -> (body | merge); continue target -> header
        spv::Block& testBlock = builder.makeNewBlock();
        builder.createBranch(true, &testBlock);

        builder.setBuildPoint(&testBlock);
        const spv::Id condition = emitTest();
        builder.createConditionalBranch(condition, &loopBlocks.body, &loopBlocks.merge);

        emitBodyAndTerminal();
        builder.createBranch(true, &loopBlocks.head);
    } else {
        // header -> body; continue target -> (header | merge)
        builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
        builder.createBranch(true, &loopBlocks.body);

        emitBodyAndTerminal();
        if (node->getTest()) {
            const spv::Id condition = emitTest();
            builder.createConditionalBranch(condition, &loopBlocks.head, &loopBlocks.merge);
        } else {
            // TODO: unless there was a break/return/discard instruction
            // somewhere in the body, this is an infinite loop, so we should
            // issue a warning.
            builder.createBranch(true, &loopBlocks.head);
        }
    }

    builder.setBuildPoint(&loopBlocks.merge);
    builder.closeLoop();
    return false;
}
4991
4992
// Translates a branch node: discard, terminate-invocation, break, continue,
// return, demote, and the ray-tracing terminate/ignore statements.
// The branch's expression, when present, is traversed first.
// Always returns false.
bool TGlslangToSpvTraverser::visitBranch(glslang::TVisit /* visit */, glslang::TIntermBranch* node)
{
    if (node->getExpression())
        node->getExpression()->traverse(this);

    builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());

    switch (node->getFlowOp()) {
    case glslang::EOpKill: {
        // SPIR-V 1.6 and later targets get a demote instruction; earlier
        // targets get OpKill as a statement terminator.
        const bool spv16OrLater = glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6;
        if (spv16OrLater) {
            builder.addCapability(spv::Capability::DemoteToHelperInvocation);
            builder.createNoResultOp(spv::Op::OpDemoteToHelperInvocationEXT);
        } else {
            builder.makeStatementTerminator(spv::Op::OpKill, "post-discard");
        }
        break;
    }

    case glslang::EOpTerminateInvocation:
        builder.addExtension(spv::E_SPV_KHR_terminate_invocation);
        builder.makeStatementTerminator(spv::Op::OpTerminateInvocation, "post-terminate-invocation");
        break;

    case glslang::EOpBreak:
        // The top of breakForLoop tells whether the innermost breakable
        // construct is a loop (true) or a switch (false).
        if (breakForLoop.top())
            builder.createLoopExit();
        else
            builder.addSwitchBreak(false);
        break;

    case glslang::EOpContinue:
        builder.createLoopContinue();
        break;

    case glslang::EOpReturn:
        if (node->getExpression() == nullptr) {
            builder.makeReturn(false);
        } else {
            const glslang::TType& exprType = node->getExpression()->getType();
            spv::Id valueId = accessChainLoad(exprType);

            // When the loaded value's SPIR-V type or precision differs from
            // the function's declared return, store it through a temporary of
            // the return type and return the value reloaded from there.
            if (builder.getTypeId(valueId) != currentFunction->getReturnType() ||
                TranslatePrecisionDecoration(exprType) != currentFunction->getReturnPrecision()) {
                builder.clearAccessChain();
                const spv::Id tempId = builder.createVariable(currentFunction->getReturnPrecision(),
                                                              spv::StorageClass::Function,
                                                              currentFunction->getReturnType());
                builder.setAccessChainLValue(tempId);
                multiTypeStore(exprType, valueId);
                valueId = builder.createLoad(tempId, currentFunction->getReturnPrecision());
            }
            builder.makeReturn(false, valueId);
        }

        builder.clearAccessChain();
        break;

    case glslang::EOpDemote:
        builder.createNoResultOp(spv::Op::OpDemoteToHelperInvocationEXT);
        builder.addExtension(spv::E_SPV_EXT_demote_to_helper_invocation);
        builder.addCapability(spv::Capability::DemoteToHelperInvocationEXT);
        break;

    case glslang::EOpTerminateRayKHR:
        builder.makeStatementTerminator(spv::Op::OpTerminateRayKHR, "post-terminateRayKHR");
        break;

    case glslang::EOpIgnoreIntersectionKHR:
        builder.makeStatementTerminator(spv::Op::OpIgnoreIntersectionKHR, "post-ignoreIntersectionKHR");
        break;

    default:
        // Any other flow op is not expected here.
        assert(0);
        break;
    }

    return false;
}
5060
5061
// Visit a variable declaration node. On the pre-visit, the debug source
// location is set to the declared symbol's location and the symbol is looked
// up once so that its debug info gets created. Always returns true so the
// traversal continues into the node's children.
bool TGlslangToSpvTraverser::visitVariableDecl(glslang::TVisit visit, glslang::TIntermVariableDecl* node)
{
    if (visit != glslang::EvPreVisit)
        return true;

    auto* const declaredSymbol = node->getDeclSymbol();
    const auto& declLoc = declaredSymbol->getLoc();
    builder.setDebugSourceLocation(declLoc.line, declLoc.getFilename());

    // We touch the symbol once here to create the debug info.
    getSymbolId(declaredSymbol);

    return true;
}
5071
5072
5073
// Create the SPIR-V object for a glslang symbol and return its Id.
//
// Constant-qualified symbols (including specialization constants) that map to
// a SPIR-V constant return that constant's Id. Everything else becomes a
// variable of type 'forcedType' (or of the converted glslang type when
// 'forcedType' is spv::NoType), after the 8/16-bit storage capabilities its
// type needs have been declared and with its memory decorations applied.
spv::Id TGlslangToSpvTraverser::createSpvVariable(const glslang::TIntermSymbol* node, spv::Id forcedType)
{
    const glslang::TType& symbolType = node->getType();

    // First, steer off constants, which are not SPIR-V variables, but
    // can still have a mapping to a SPIR-V Id.
    // This includes specialization constants.
    if (node->getQualifier().isConstant()) {
        const spv::Id constantId = createSpvConstant(*node);
        if (constantId != spv::NoResult) {
            auto accessName = node->getAsSymbolNode()->getAccessName().c_str();
            auto constTypeId = convertGlslangToSpvType(symbolType);
            builder.createConstVariable(constTypeId, accessName, constantId, currentFunction == nullptr);
            return constantId;
        }
    }

    // Now, handle actual variables
    const spv::StorageClass storageClass = TranslateStorageClass(symbolType);
    const spv::Id spvType = (forcedType != spv::NoType) ? forcedType
                                                        : convertGlslangToSpvType(symbolType);

    const bool isWorkgroupBlock = storageClass == spv::StorageClass::Workgroup &&
                                  symbolType.getBasicType() == glslang::EbtBlock;

    // Declare what is needed for 16-bit types, depending on where they live.
    const bool hasFloat16 = symbolType.contains16BitFloat();
    const bool hasInt16 = symbolType.contains16BitInt();
    if (hasFloat16 || hasInt16) {
        switch (storageClass) {
        case spv::StorageClass::Input:
        case spv::StorageClass::Output:
            builder.addIncorporatedExtension(spv::E_SPV_KHR_16bit_storage, spv::Spv_1_3);
            builder.addCapability(spv::Capability::StorageInputOutput16);
            break;
        case spv::StorageClass::Uniform: {
            builder.addIncorporatedExtension(spv::E_SPV_KHR_16bit_storage, spv::Spv_1_3);
            const bool isBufferBlock = symbolType.getQualifier().storage == glslang::EvqBuffer;
            builder.addCapability(isBufferBlock ? spv::Capability::StorageUniformBufferBlock16
                                                : spv::Capability::StorageUniform16);
            break;
        }
        case spv::StorageClass::PushConstant:
            builder.addIncorporatedExtension(spv::E_SPV_KHR_16bit_storage, spv::Spv_1_3);
            builder.addCapability(spv::Capability::StoragePushConstant16);
            break;
        case spv::StorageClass::StorageBuffer:
        case spv::StorageClass::PhysicalStorageBufferEXT:
            builder.addIncorporatedExtension(spv::E_SPV_KHR_16bit_storage, spv::Spv_1_3);
            builder.addCapability(spv::Capability::StorageUniformBufferBlock16);
            break;
        case spv::StorageClass::TileAttachmentQCOM:
            builder.addCapability(spv::Capability::TileShadingQCOM);
            break;
        default:
            if (isWorkgroupBlock) {
                builder.addCapability(spv::Capability::WorkgroupMemoryExplicitLayout16BitAccessKHR);
            } else {
                if (hasFloat16)
                    builder.addCapability(spv::Capability::Float16);
                if (hasInt16)
                    builder.addCapability(spv::Capability::Int16);
            }
            break;
        }
    }

    // Likewise for 8-bit integer types.
    if (symbolType.contains8BitInt()) {
        switch (storageClass) {
        case spv::StorageClass::PushConstant:
            builder.addIncorporatedExtension(spv::E_SPV_KHR_8bit_storage, spv::Spv_1_5);
            builder.addCapability(spv::Capability::StoragePushConstant8);
            break;
        case spv::StorageClass::Uniform:
            builder.addIncorporatedExtension(spv::E_SPV_KHR_8bit_storage, spv::Spv_1_5);
            builder.addCapability(spv::Capability::UniformAndStorageBuffer8BitAccess);
            break;
        case spv::StorageClass::StorageBuffer:
            builder.addIncorporatedExtension(spv::E_SPV_KHR_8bit_storage, spv::Spv_1_5);
            builder.addCapability(spv::Capability::StorageBuffer8BitAccess);
            break;
        default:
            if (isWorkgroupBlock)
                builder.addCapability(spv::Capability::WorkgroupMemoryExplicitLayout8BitAccessKHR);
            else
                builder.addCapability(spv::Capability::Int8);
            break;
        }
    }

    // Anonymous symbols get an empty name.
    const char* name = node->getName().c_str();
    if (glslang::IsAnonymous(name))
        name = "";

    // Uniforms with a constant array get a constant initializer;
    // null-init qualified variables get a null constant.
    spv::Id initializer = spv::NoResult;
    if (symbolType.getQualifier().storage == glslang::EvqUniform && !node->getConstArray().empty()) {
        int nextConst = 0;
        initializer = createSpvConstantFromConstUnionArray(symbolType,
                                                           node->getConstArray(),
                                                           nextConst,
                                                           false /* specConst */);
    } else if (symbolType.getQualifier().isNullInit()) {
        initializer = builder.makeNullConstant(spvType);
    }

    const spv::Id var = builder.createVariable(spv::NoPrecision, storageClass, spvType, name, initializer, false);

    if (options.emitNonSemanticShaderDebugInfo && storageClass != spv::StorageClass::Function) {
        // Create variable alias for retargeted symbols if any.
        // Notably, this is only applicable to built-in variables so that it is okay to only use name as the key.
        const auto aliases = glslangIntermediate->getBuiltinAliasLookup().equal_range(name);
        for (auto alias = aliases.first; alias != aliases.second; ++alias)
            builder.createDebugGlobalVariable(builder.getDebugType(spvType), alias->second.c_str(), var);
    }

    std::vector<spv::Decoration> topLevelDecorations;
    glslang::TQualifier typeQualifier = symbolType.getQualifier();
    TranslateMemoryDecoration(typeQualifier, topLevelDecorations, glslangIntermediate->usingVulkanMemoryModel());
    for (auto deco : topLevelDecorations) {
#ifdef __APPLE__
        // On Apple builds the restrict decorations are not emitted.
        if (deco == spv::Decoration::Restrict ||
            deco == spv::Decoration::RestrictPointer ||
            deco == spv::Decoration::RestrictPointerEXT)
            continue;
#endif
        builder.addDecoration(var, deco);
    }

    return var;
}
5193
5194
// Return type Id of the sampled type.
5195
spv::Id TGlslangToSpvTraverser::getSampledType(const glslang::TSampler& sampler)
5196
{
5197
switch (sampler.type) {
5198
case glslang::EbtInt: return builder.makeIntType(32);
5199
case glslang::EbtUint: return builder.makeUintType(32);
5200
case glslang::EbtFloat: return builder.makeFloatType(32);
5201
case glslang::EbtFloat16:
5202
builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float_fetch);
5203
builder.addCapability(spv::Capability::Float16ImageAMD);
5204
return builder.makeFloatType(16);
5205
case glslang::EbtInt64:
5206
builder.addExtension(spv::E_SPV_EXT_shader_image_int64);
5207
builder.addCapability(spv::Capability::Int64ImageEXT);
5208
return builder.makeIntType(64);
5209
case glslang::EbtUint64:
5210
builder.addExtension(spv::E_SPV_EXT_shader_image_int64);
5211
builder.addCapability(spv::Capability::Int64ImageEXT);
5212
return builder.makeUintType(64);
5213
default:
5214
assert(0);
5215
return builder.makeFloatType(32);
5216
}
5217
}
5218
5219
// If node is a swizzle operation, return the type that should be used if
5220
// the swizzle base is first consumed by another operation, before the swizzle
5221
// is applied.
5222
spv::Id TGlslangToSpvTraverser::getInvertedSwizzleType(const glslang::TIntermTyped& node)
5223
{
5224
if (node.getAsOperator() &&
5225
node.getAsOperator()->getOp() == glslang::EOpVectorSwizzle)
5226
return convertGlslangToSpvType(node.getAsBinaryNode()->getLeft()->getType());
5227
else
5228
return spv::NoType;
5229
}
5230
5231
// When inverting a swizzle with a parent op, this function
5232
// will apply the swizzle operation to a completed parent operation.
5233
spv::Id TGlslangToSpvTraverser::createInvertedSwizzle(spv::Decoration precision, const glslang::TIntermTyped& node,
5234
spv::Id parentResult)
5235
{
5236
std::vector<unsigned> swizzle;
5237
convertSwizzle(*node.getAsBinaryNode()->getRight()->getAsAggregate(), swizzle);
5238
return builder.createRvalueSwizzle(precision, convertGlslangToSpvType(node.getType()), parentResult, swizzle);
5239
}
5240
5241
// Convert a glslang AST swizzle node to a swizzle vector for building SPIR-V.
5242
void TGlslangToSpvTraverser::convertSwizzle(const glslang::TIntermAggregate& node, std::vector<unsigned>& swizzle)
5243
{
5244
const glslang::TIntermSequence& swizzleSequence = node.getSequence();
5245
for (int i = 0; i < (int)swizzleSequence.size(); ++i)
5246
swizzle.push_back(swizzleSequence[i]->getAsConstantUnion()->getConstArray()[0].getIConst());
5247
}
5248
5249
// Convert from a glslang type to an SPV type, by calling into a
5250
// recursive version of this function. This establishes the inherited
5251
// layout state rooted from the top-level type.
5252
spv::Id TGlslangToSpvTraverser::convertGlslangToSpvType(const glslang::TType& type, bool forwardReferenceOnly)
5253
{
5254
return convertGlslangToSpvType(type, getExplicitLayout(type), type.getQualifier(), false, forwardReferenceOnly);
5255
}
5256
5257
// Map a glslang linkage kind to the SPIR-V linkage type. Only export linkage
// has a mapping; every other kind yields spv::LinkageType::Max.
spv::LinkageType TGlslangToSpvTraverser::convertGlslangLinkageToSpv(glslang::TLinkType linkType)
{
    if (linkType == glslang::ELinkExport)
        return spv::LinkageType::Export;

    return spv::LinkageType::Max;
}
5266
5267
// Do full recursive conversion of an arbitrary glslang type to a SPIR-V Id.
5268
// explicitLayout can be kept the same throughout the hierarchical recursive walk.
5269
// Mutually recursive with convertGlslangStructToSpvType().
5270
spv::Id TGlslangToSpvTraverser::convertGlslangToSpvType(const glslang::TType& type,
5271
glslang::TLayoutPacking explicitLayout, const glslang::TQualifier& qualifier,
5272
bool lastBufferBlockMember, bool forwardReferenceOnly)
5273
{
5274
spv::Id spvType = spv::NoResult;
5275
5276
switch (type.getBasicType()) {
5277
case glslang::EbtVoid:
5278
spvType = builder.makeVoidType();
5279
assert (! type.isArray());
5280
break;
5281
case glslang::EbtBool:
5282
// "transparent" bool doesn't exist in SPIR-V. The GLSL convention is
5283
// a 32-bit int where non-0 means true.
5284
if (explicitLayout != glslang::ElpNone)
5285
spvType = builder.makeUintType(32);
5286
else
5287
spvType = builder.makeBoolType();
5288
break;
5289
case glslang::EbtInt:
5290
spvType = builder.makeIntType(32);
5291
break;
5292
case glslang::EbtUint:
5293
spvType = builder.makeUintType(32);
5294
break;
5295
case glslang::EbtFloat:
5296
spvType = builder.makeFloatType(32);
5297
break;
5298
case glslang::EbtDouble:
5299
spvType = builder.makeFloatType(64);
5300
break;
5301
case glslang::EbtFloat16:
5302
spvType = builder.makeFloatType(16);
5303
break;
5304
case glslang::EbtBFloat16:
5305
spvType = builder.makeBFloat16Type();
5306
break;
5307
case glslang::EbtFloatE5M2:
5308
spvType = builder.makeFloatE5M2Type();
5309
break;
5310
case glslang::EbtFloatE4M3:
5311
spvType = builder.makeFloatE4M3Type();
5312
break;
5313
case glslang::EbtInt8:
5314
spvType = builder.makeIntType(8);
5315
break;
5316
case glslang::EbtUint8:
5317
spvType = builder.makeUintType(8);
5318
break;
5319
case glslang::EbtInt16:
5320
spvType = builder.makeIntType(16);
5321
break;
5322
case glslang::EbtUint16:
5323
spvType = builder.makeUintType(16);
5324
break;
5325
case glslang::EbtInt64:
5326
spvType = builder.makeIntType(64);
5327
break;
5328
case glslang::EbtUint64:
5329
spvType = builder.makeUintType(64);
5330
break;
5331
case glslang::EbtAtomicUint:
5332
builder.addCapability(spv::Capability::AtomicStorage);
5333
spvType = builder.makeUintType(32);
5334
break;
5335
case glslang::EbtAccStruct:
5336
switch (glslangIntermediate->getStage()) {
5337
case EShLangRayGen:
5338
case EShLangIntersect:
5339
case EShLangAnyHit:
5340
case EShLangClosestHit:
5341
case EShLangMiss:
5342
case EShLangCallable:
5343
// these all should have the RayTracingNV/KHR capability already
5344
break;
5345
default:
5346
{
5347
auto& extensions = glslangIntermediate->getRequestedExtensions();
5348
if (extensions.find("GL_EXT_ray_query") != extensions.end()) {
5349
builder.addExtension(spv::E_SPV_KHR_ray_query);
5350
builder.addCapability(spv::Capability::RayQueryKHR);
5351
}
5352
}
5353
break;
5354
}
5355
spvType = builder.makeAccelerationStructureType();
5356
break;
5357
case glslang::EbtRayQuery:
5358
{
5359
auto& extensions = glslangIntermediate->getRequestedExtensions();
5360
if (extensions.find("GL_EXT_ray_query") != extensions.end()) {
5361
builder.addExtension(spv::E_SPV_KHR_ray_query);
5362
builder.addCapability(spv::Capability::RayQueryKHR);
5363
}
5364
spvType = builder.makeRayQueryType();
5365
}
5366
break;
5367
case glslang::EbtReference:
5368
{
5369
// Make the forward pointer, then recurse to convert the structure type, then
5370
// patch up the forward pointer with a real pointer type.
5371
if (forwardPointers.find(type.getReferentType()) == forwardPointers.end()) {
5372
spv::Id forwardId = builder.makeForwardPointer(spv::StorageClass::PhysicalStorageBufferEXT);
5373
forwardPointers[type.getReferentType()] = forwardId;
5374
}
5375
spvType = forwardPointers[type.getReferentType()];
5376
if (!forwardReferenceOnly) {
5377
spv::Id referentType = convertGlslangToSpvType(*type.getReferentType());
5378
builder.makePointerFromForwardPointer(spv::StorageClass::PhysicalStorageBufferEXT,
5379
forwardPointers[type.getReferentType()],
5380
referentType);
5381
}
5382
}
5383
break;
5384
case glslang::EbtSampler:
5385
{
5386
const glslang::TSampler& sampler = type.getSampler();
5387
std::string debugName;
5388
5389
if (sampler.isPureSampler()) {
5390
if (options.emitNonSemanticShaderDebugInfo) {
5391
if (glslangIntermediate->getSource() == glslang::EShSourceGlsl) {
5392
debugName = sampler.getString();
5393
}
5394
else {
5395
debugName = "type.sampler";
5396
}
5397
}
5398
spvType = builder.makeSamplerType(debugName.c_str());
5399
} else {
5400
// an image is present, make its type
5401
if (options.emitNonSemanticShaderDebugInfo) {
5402
if (glslangIntermediate->getSource() == glslang::EShSourceGlsl) {
5403
debugName = sampler.removeCombined().getString();
5404
}
5405
else {
5406
switch (sampler.dim) {
5407
case glslang::Esd1D: debugName = "type.1d.image"; break;
5408
case glslang::Esd2D: debugName = "type.2d.image"; break;
5409
case glslang::Esd3D: debugName = "type.3d.image"; break;
5410
case glslang::EsdCube: debugName = "type.cube.image"; break;
5411
default: debugName = "type.image"; break;
5412
}
5413
}
5414
}
5415
spvType = builder.makeImageType(getSampledType(sampler), TranslateDimensionality(sampler),
5416
sampler.isShadow(), sampler.isArrayed(), sampler.isMultiSample(),
5417
sampler.isImageClass() ? 2 : 1, TranslateImageFormat(type), debugName.c_str());
5418
if (sampler.isCombined() &&
5419
(!sampler.isBuffer() || glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_6)) {
5420
// Already has both image and sampler, make the combined type. Only combine sampler to
5421
// buffer if before SPIR-V 1.6.
5422
if (options.emitNonSemanticShaderDebugInfo) {
5423
if (glslangIntermediate->getSource() == glslang::EShSourceGlsl) {
5424
debugName = sampler.getString();
5425
}
5426
else {
5427
debugName = "type.sampled.image";
5428
}
5429
}
5430
spvType = builder.makeSampledImageType(spvType, debugName.c_str());
5431
}
5432
}
5433
}
5434
break;
5435
case glslang::EbtStruct:
5436
case glslang::EbtBlock:
5437
{
5438
// If we've seen this struct type, return it
5439
const glslang::TTypeList* glslangMembers = type.getStruct();
5440
5441
// Try to share structs for different layouts, but not yet for other
5442
// kinds of qualification (primarily not yet including interpolant qualification).
5443
if (! HasNonLayoutQualifiers(type, qualifier))
5444
spvType = structMap[explicitLayout][qualifier.layoutMatrix][glslangMembers];
5445
if (spvType != spv::NoResult)
5446
break;
5447
5448
// else, we haven't seen it...
5449
if (type.getBasicType() == glslang::EbtBlock)
5450
memberRemapper[glslangTypeToIdMap[glslangMembers]].resize(glslangMembers->size());
5451
spvType = convertGlslangStructToSpvType(type, glslangMembers, explicitLayout, qualifier);
5452
}
5453
break;
5454
case glslang::EbtString:
5455
// no type used for OpString
5456
return 0;
5457
5458
case glslang::EbtHitObjectNV: {
5459
builder.addExtension(spv::E_SPV_NV_shader_invocation_reorder);
5460
builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
5461
spvType = builder.makeHitObjectNVType();
5462
}
5463
break;
5464
5465
case glslang::EbtHitObjectEXT: {
5466
builder.addExtension(spv::E_SPV_EXT_shader_invocation_reorder);
5467
builder.addCapability(spv::Capability::ShaderInvocationReorderEXT);
5468
spvType = builder.makeHitObjectEXTType();
5469
}
5470
break;
5471
case glslang::EbtSpirvType: {
5472
// GL_EXT_spirv_intrinsics
5473
const auto& spirvType = type.getSpirvType();
5474
const auto& spirvInst = spirvType.spirvInst;
5475
5476
std::vector<spv::IdImmediate> operands;
5477
for (const auto& typeParam : spirvType.typeParams) {
5478
if (typeParam.getAsConstant() != nullptr) {
5479
// Constant expression
5480
auto constant = typeParam.getAsConstant();
5481
if (constant->isLiteral()) {
5482
if (constant->getBasicType() == glslang::EbtFloat) {
5483
float floatValue = static_cast<float>(constant->getConstArray()[0].getDConst());
5484
unsigned literal;
5485
static_assert(sizeof(literal) == sizeof(floatValue), "sizeof(unsigned) != sizeof(float)");
5486
memcpy(&literal, &floatValue, sizeof(literal));
5487
operands.push_back({false, literal});
5488
} else if (constant->getBasicType() == glslang::EbtInt) {
5489
unsigned literal = constant->getConstArray()[0].getIConst();
5490
operands.push_back({false, literal});
5491
} else if (constant->getBasicType() == glslang::EbtUint) {
5492
unsigned literal = constant->getConstArray()[0].getUConst();
5493
operands.push_back({false, literal});
5494
} else if (constant->getBasicType() == glslang::EbtBool) {
5495
unsigned literal = constant->getConstArray()[0].getBConst();
5496
operands.push_back({false, literal});
5497
} else if (constant->getBasicType() == glslang::EbtString) {
5498
auto str = constant->getConstArray()[0].getSConst()->c_str();
5499
unsigned literal = 0;
5500
char* literalPtr = reinterpret_cast<char*>(&literal);
5501
unsigned charCount = 0;
5502
char ch = 0;
5503
do {
5504
ch = *(str++);
5505
*(literalPtr++) = ch;
5506
++charCount;
5507
if (charCount == 4) {
5508
operands.push_back({false, literal});
5509
literalPtr = reinterpret_cast<char*>(&literal);
5510
charCount = 0;
5511
}
5512
} while (ch != 0);
5513
5514
// Partial literal is padded with 0
5515
if (charCount > 0) {
5516
for (; charCount < 4; ++charCount)
5517
*(literalPtr++) = 0;
5518
operands.push_back({false, literal});
5519
}
5520
} else
5521
assert(0); // Unexpected type
5522
} else
5523
operands.push_back({true, createSpvConstant(*constant)});
5524
} else {
5525
// Type specifier
5526
assert(typeParam.getAsType() != nullptr);
5527
operands.push_back({true, convertGlslangToSpvType(*typeParam.getAsType())});
5528
}
5529
}
5530
5531
assert(spirvInst.set == ""); // Currently, couldn't be extended instructions.
5532
spvType = builder.makeGenericType(static_cast<spv::Op>(spirvInst.id), operands);
5533
5534
break;
5535
}
5536
case glslang::EbtTensorLayoutNV:
5537
{
5538
builder.addCapability(spv::Capability::TensorAddressingNV);
5539
builder.addExtension(spv::E_SPV_NV_tensor_addressing);
5540
5541
std::vector<spv::IdImmediate> operands;
5542
for (uint32_t i = 0; i < 2; ++i) {
5543
operands.push_back({true, makeArraySizeId(*type.getTypeParameters()->arraySizes, i, true)});
5544
}
5545
spvType = builder.makeGenericType(spv::Op::OpTypeTensorLayoutNV, operands);
5546
break;
5547
}
5548
case glslang::EbtTensorViewNV:
5549
{
5550
builder.addCapability(spv::Capability::TensorAddressingNV);
5551
builder.addExtension(spv::E_SPV_NV_tensor_addressing);
5552
5553
uint32_t dim = type.getTypeParameters()->arraySizes->getDimSize(0);
5554
assert(dim >= 1 && dim <= 5);
5555
std::vector<spv::IdImmediate> operands;
5556
for (uint32_t i = 0; i < dim + 2; ++i) {
5557
operands.push_back({true, makeArraySizeId(*type.getTypeParameters()->arraySizes, i, true, i==1)});
5558
}
5559
spvType = builder.makeGenericType(spv::Op::OpTypeTensorViewNV, operands);
5560
break;
5561
}
5562
default:
5563
assert(0);
5564
break;
5565
}
5566
5567
if (type.isMatrix())
5568
spvType = builder.makeMatrixType(spvType, type.getMatrixCols(), type.getMatrixRows());
5569
else {
5570
// If this variable has a vector element count greater than 1, create a SPIR-V vector
5571
if (type.getVectorSize() > 1)
5572
spvType = builder.makeVectorType(spvType, type.getVectorSize());
5573
}
5574
5575
if (type.isCoopMatNV()) {
5576
builder.addCapability(spv::Capability::CooperativeMatrixNV);
5577
builder.addExtension(spv::E_SPV_NV_cooperative_matrix);
5578
5579
if (type.getBasicType() == glslang::EbtFloat16)
5580
builder.addCapability(spv::Capability::Float16);
5581
if (type.getBasicType() == glslang::EbtUint8 ||
5582
type.getBasicType() == glslang::EbtInt8) {
5583
builder.addCapability(spv::Capability::Int8);
5584
}
5585
5586
spv::Id scope = makeArraySizeId(*type.getTypeParameters()->arraySizes, 1);
5587
spv::Id rows = makeArraySizeId(*type.getTypeParameters()->arraySizes, 2);
5588
spv::Id cols = makeArraySizeId(*type.getTypeParameters()->arraySizes, 3);
5589
5590
spvType = builder.makeCooperativeMatrixTypeNV(spvType, scope, rows, cols);
5591
}
5592
5593
if (type.isCoopMatKHR()) {
5594
builder.addCapability(spv::Capability::CooperativeMatrixKHR);
5595
builder.addExtension(spv::E_SPV_KHR_cooperative_matrix);
5596
5597
if (type.getBasicType() == glslang::EbtBFloat16) {
5598
builder.addExtension(spv::E_SPV_KHR_bfloat16);
5599
builder.addCapability(spv::Capability::BFloat16CooperativeMatrixKHR);
5600
}
5601
5602
if (type.getBasicType() == glslang::EbtFloatE5M2 || type.getBasicType() == glslang::EbtFloatE4M3) {
5603
builder.addExtension(spv::E_SPV_EXT_float8);
5604
builder.addCapability(spv::Capability::Float8CooperativeMatrixEXT);
5605
}
5606
5607
if (type.getBasicType() == glslang::EbtFloat16)
5608
builder.addCapability(spv::Capability::Float16);
5609
if (type.getBasicType() == glslang::EbtUint8 || type.getBasicType() == glslang::EbtInt8) {
5610
builder.addCapability(spv::Capability::Int8);
5611
}
5612
5613
spv::Id scope = makeArraySizeId(*type.getTypeParameters()->arraySizes, 0);
5614
spv::Id rows = makeArraySizeId(*type.getTypeParameters()->arraySizes, 1);
5615
spv::Id cols = makeArraySizeId(*type.getTypeParameters()->arraySizes, 2);
5616
spv::Id use = makeArraySizeId(*type.getTypeParameters()->arraySizes, 3, true);
5617
5618
spvType = builder.makeCooperativeMatrixTypeKHR(spvType, scope, rows, cols, use);
5619
}
5620
else if (type.isTensorARM()) {
5621
builder.addCapability(spv::Capability::TensorsARM);
5622
builder.addExtension(spv::E_SPV_ARM_tensors);
5623
if (type.getBasicType() == glslang::EbtInt8 || type.getBasicType() == glslang::EbtUint8) {
5624
builder.addCapability(spv::Capability::Int8);
5625
} else if (type.getBasicType() == glslang::EbtInt16 ||
5626
type.getBasicType() == glslang::EbtUint16) {
5627
builder.addCapability(spv::Capability::Int16);
5628
} else if (type.getBasicType() == glslang::EbtInt64 ||
5629
type.getBasicType() == glslang::EbtUint64) {
5630
builder.addCapability(spv::Capability::Int64);
5631
} else if (type.getBasicType() == glslang::EbtFloat16) {
5632
builder.addCapability(spv::Capability::Float16);
5633
}
5634
5635
spv::Id rank = makeArraySizeId(*type.getTypeParameters()->arraySizes, 0);
5636
5637
spvType = builder.makeTensorTypeARM(spvType, rank);
5638
}
5639
5640
if (type.isCoopVecNV()) {
5641
builder.addCapability(spv::Capability::CooperativeVectorNV);
5642
builder.addExtension(spv::E_SPV_NV_cooperative_vector);
5643
5644
if (type.getBasicType() == glslang::EbtFloat16)
5645
builder.addCapability(spv::Capability::Float16);
5646
if (type.getBasicType() == glslang::EbtUint8 || type.getBasicType() == glslang::EbtInt8) {
5647
builder.addCapability(spv::Capability::Int8);
5648
}
5649
5650
spv::Id components = makeArraySizeId(*type.getTypeParameters()->arraySizes, 0);
5651
5652
spvType = builder.makeCooperativeVectorTypeNV(spvType, components);
5653
}
5654
5655
if (type.isArray()) {
5656
int stride = 0; // keep this 0 unless doing an explicit layout; 0 will mean no decoration, no stride
5657
5658
// Do all but the outer dimension
5659
if (type.getArraySizes()->getNumDims() > 1) {
5660
// We need to decorate array strides for types needing explicit layout, except blocks.
5661
if (explicitLayout != glslang::ElpNone && type.getBasicType() != glslang::EbtBlock) {
5662
// Use a dummy glslang type for querying internal strides of
5663
// arrays of arrays, but using just a one-dimensional array.
5664
glslang::TType simpleArrayType(type, 0); // deference type of the array
5665
while (simpleArrayType.getArraySizes()->getNumDims() > 1)
5666
simpleArrayType.getArraySizes()->dereference();
5667
5668
// Will compute the higher-order strides here, rather than making a whole
5669
// pile of types and doing repetitive recursion on their contents.
5670
stride = getArrayStride(simpleArrayType, explicitLayout, qualifier.layoutMatrix);
5671
}
5672
5673
// make the arrays
5674
for (int dim = type.getArraySizes()->getNumDims() - 1; dim > 0; --dim) {
5675
spvType = builder.makeArrayType(spvType, makeArraySizeId(*type.getArraySizes(), dim), stride);
5676
if (stride > 0)
5677
builder.addDecoration(spvType, spv::Decoration::ArrayStride, stride);
5678
stride *= type.getArraySizes()->getDimSize(dim);
5679
}
5680
} else {
5681
// single-dimensional array, and don't yet have stride
5682
5683
// We need to decorate array strides for types needing explicit layout, except blocks.
5684
if (explicitLayout != glslang::ElpNone && type.getBasicType() != glslang::EbtBlock)
5685
stride = getArrayStride(type, explicitLayout, qualifier.layoutMatrix);
5686
}
5687
5688
// Do the outer dimension, which might not be known for a runtime-sized array.
5689
// (Unsized arrays that survive through linking will be runtime-sized arrays)
5690
if (type.isSizedArray())
5691
spvType = builder.makeArrayType(spvType, makeArraySizeId(*type.getArraySizes(), 0), stride);
5692
else {
5693
// If we see an runtime array in a buffer_reference, it is not a descriptor
5694
if (!lastBufferBlockMember && type.getBasicType() != glslang::EbtReference) {
5695
builder.addIncorporatedExtension("SPV_EXT_descriptor_indexing", spv::Spv_1_5);
5696
builder.addCapability(spv::Capability::RuntimeDescriptorArrayEXT);
5697
}
5698
spvType = builder.makeRuntimeArray(spvType);
5699
}
5700
if (stride > 0)
5701
builder.addDecoration(spvType, spv::Decoration::ArrayStride, stride);
5702
}
5703
5704
return spvType;
5705
}
5706
5707
// Apply SPIR-V decorations to the SPIR-V object (provided by SPIR-V ID). If member index is provided, the
5708
// decorations are applied to this member.
5709
void TGlslangToSpvTraverser::applySpirvDecorate(const glslang::TType& type, spv::Id id, std::optional<int> member)
5710
{
5711
assert(type.getQualifier().hasSpirvDecorate());
5712
5713
const glslang::TSpirvDecorate& spirvDecorate = type.getQualifier().getSpirvDecorate();
5714
5715
// Add spirv_decorate
5716
for (auto& decorate : spirvDecorate.decorates) {
5717
if (!decorate.second.empty()) {
5718
std::vector<unsigned> literals;
5719
TranslateLiterals(decorate.second, literals);
5720
if (member.has_value())
5721
builder.addMemberDecoration(id, *member, static_cast<spv::Decoration>(decorate.first), literals);
5722
else
5723
builder.addDecoration(id, static_cast<spv::Decoration>(decorate.first), literals);
5724
} else {
5725
if (member.has_value())
5726
builder.addMemberDecoration(id, *member, static_cast<spv::Decoration>(decorate.first));
5727
else
5728
builder.addDecoration(id, static_cast<spv::Decoration>(decorate.first));
5729
}
5730
}
5731
5732
// Add spirv_decorate_id
5733
if (member.has_value()) {
5734
// spirv_decorate_id not applied to members
5735
assert(spirvDecorate.decorateIds.empty());
5736
} else {
5737
for (auto& decorateId : spirvDecorate.decorateIds) {
5738
std::vector<spv::Id> operandIds;
5739
assert(!decorateId.second.empty());
5740
for (auto extraOperand : decorateId.second) {
5741
if (extraOperand->getQualifier().isFrontEndConstant())
5742
operandIds.push_back(createSpvConstant(*extraOperand));
5743
else
5744
operandIds.push_back(getSymbolId(extraOperand->getAsSymbolNode()));
5745
}
5746
builder.addDecorationId(id, static_cast<spv::Decoration>(decorateId.first), operandIds);
5747
}
5748
}
5749
5750
// Add spirv_decorate_string
5751
for (auto& decorateString : spirvDecorate.decorateStrings) {
5752
std::vector<const char*> strings;
5753
assert(!decorateString.second.empty());
5754
for (auto extraOperand : decorateString.second) {
5755
const char* string = extraOperand->getConstArray()[0].getSConst()->c_str();
5756
strings.push_back(string);
5757
}
5758
if (member.has_value())
5759
builder.addMemberDecoration(id, *member, static_cast<spv::Decoration>(decorateString.first), strings);
5760
else
5761
builder.addDecoration(id, static_cast<spv::Decoration>(decorateString.first), strings);
5762
}
5763
}
5764
5765
// TODO: this functionality should exist at a higher level, in creating the AST
5766
//
5767
// Identify interface members that don't have their required extension turned on.
5768
//
5769
bool TGlslangToSpvTraverser::filterMember(const glslang::TType& member)
5770
{
5771
auto& extensions = glslangIntermediate->getRequestedExtensions();
5772
5773
if (member.getFieldName() == "gl_SecondaryViewportMaskNV" &&
5774
extensions.find("GL_NV_stereo_view_rendering") == extensions.end())
5775
return true;
5776
if (member.getFieldName() == "gl_SecondaryPositionNV" &&
5777
extensions.find("GL_NV_stereo_view_rendering") == extensions.end())
5778
return true;
5779
5780
if (glslangIntermediate->getStage() == EShLangMesh) {
5781
if (member.getFieldName() == "gl_PrimitiveShadingRateEXT" &&
5782
extensions.find("GL_EXT_fragment_shading_rate") == extensions.end())
5783
return true;
5784
}
5785
5786
if (glslangIntermediate->getStage() != EShLangMesh) {
5787
if (member.getFieldName() == "gl_ViewportMask" &&
5788
extensions.find("GL_NV_viewport_array2") == extensions.end())
5789
return true;
5790
if (member.getFieldName() == "gl_PositionPerViewNV" &&
5791
extensions.find("GL_NVX_multiview_per_view_attributes") == extensions.end())
5792
return true;
5793
if (member.getFieldName() == "gl_ViewportMaskPerViewNV" &&
5794
extensions.find("GL_NVX_multiview_per_view_attributes") == extensions.end())
5795
return true;
5796
}
5797
5798
return false;
5799
}
5800
5801
// Do full recursive conversion of a glslang structure (or block) type to a SPIR-V Id.
5802
// explicitLayout can be kept the same throughout the hierarchical recursive walk.
5803
// Mutually recursive with convertGlslangToSpvType().
5804
spv::Id TGlslangToSpvTraverser::convertGlslangStructToSpvType(const glslang::TType& type,
5805
const glslang::TTypeList* glslangMembers,
5806
glslang::TLayoutPacking explicitLayout,
5807
const glslang::TQualifier& qualifier)
5808
{
5809
// Create a vector of struct types for SPIR-V to consume
5810
std::vector<spv::Id> spvMembers;
5811
int memberDelta = 0; // how much the member's index changes from glslang to SPIR-V, normally 0,
5812
// except sometimes for blocks
5813
std::vector<std::pair<glslang::TType*, glslang::TQualifier> > deferredForwardPointers;
5814
std::vector<spv::StructMemberDebugInfo> memberDebugInfo;
5815
for (int i = 0; i < (int)glslangMembers->size(); i++) {
5816
auto& glslangMember = (*glslangMembers)[i];
5817
if (glslangMember.type->hiddenMember()) {
5818
++memberDelta;
5819
if (type.getBasicType() == glslang::EbtBlock)
5820
memberRemapper[glslangTypeToIdMap[glslangMembers]][i] = -1;
5821
} else {
5822
if (type.getBasicType() == glslang::EbtBlock) {
5823
if (filterMember(*glslangMember.type)) {
5824
memberDelta++;
5825
memberRemapper[glslangTypeToIdMap[glslangMembers]][i] = -1;
5826
continue;
5827
}
5828
memberRemapper[glslangTypeToIdMap[glslangMembers]][i] = i - memberDelta;
5829
}
5830
// modify just this child's view of the qualifier
5831
glslang::TQualifier memberQualifier = glslangMember.type->getQualifier();
5832
InheritQualifiers(memberQualifier, qualifier);
5833
5834
// manually inherit location
5835
if (! memberQualifier.hasLocation() && qualifier.hasLocation())
5836
memberQualifier.layoutLocation = qualifier.layoutLocation;
5837
5838
// recurse
5839
bool lastBufferBlockMember = qualifier.storage == glslang::EvqBuffer &&
5840
i == (int)glslangMembers->size() - 1;
5841
5842
// Make forward pointers for any pointer members.
5843
if (glslangMember.type->isReference() &&
5844
forwardPointers.find(glslangMember.type->getReferentType()) == forwardPointers.end()) {
5845
deferredForwardPointers.push_back(std::make_pair(glslangMember.type, memberQualifier));
5846
}
5847
5848
// Create the member type.
5849
auto const spvMember = convertGlslangToSpvType(*glslangMember.type, explicitLayout, memberQualifier, lastBufferBlockMember,
5850
glslangMember.type->isReference());
5851
spvMembers.push_back(spvMember);
5852
5853
// Update the builder with the type's location so that we can create debug types for the structure members.
5854
// There doesn't exist a "clean" entry point for this information to be passed along to the builder so, for now,
5855
// it is stored in the builder and consumed during the construction of composite debug types.
5856
// TODO: This probably warrants further investigation. This approach was decided to be the least ugly of the
5857
// quick and dirty approaches that were tried.
5858
// Advantages of this approach:
5859
// + Relatively clean. No direct calls into debug type system.
5860
// + Handles nested recursive structures.
5861
// Disadvantages of this approach:
5862
// + Not as clean as desired. Traverser queries/sets persistent state. This is fragile.
5863
// + Table lookup during creation of composite debug types. This really shouldn't be necessary.
5864
if(options.emitNonSemanticShaderDebugInfo) {
5865
spv::StructMemberDebugInfo debugInfo{};
5866
debugInfo.name = glslangMember.type->getFieldName();
5867
debugInfo.line = glslangMember.loc.line;
5868
debugInfo.column = glslangMember.loc.column;
5869
5870
// Per the GLSL spec, bool variables inside of a uniform or buffer block are generated as uint.
5871
// But for debug info, we want to represent them as bool because that is the original type in
5872
// the source code. The bool type can be nested within a vector or a multidimensional array,
5873
// so we must construct the chain of types up from the scalar bool.
5874
if (glslangIntermediate->getSource() == glslang::EShSourceGlsl && explicitLayout != glslang::ElpNone &&
5875
glslangMember.type->getBasicType() == glslang::EbtBool) {
5876
auto typeId = builder.makeBoolType();
5877
if (glslangMember.type->isVector()) {
5878
typeId = builder.makeVectorType(typeId, glslangMember.type->getVectorSize());
5879
}
5880
if (glslangMember.type->isArray()) {
5881
const auto* arraySizes = glslangMember.type->getArraySizes();
5882
int dims = arraySizes->getNumDims();
5883
for (int i = dims - 1; i >= 0; --i) {
5884
spv::Id size = builder.makeIntConstant(arraySizes->getDimSize(i));
5885
typeId = builder.makeArrayType(typeId, size, 0);
5886
}
5887
}
5888
debugInfo.debugTypeOverride = builder.getDebugType(typeId);
5889
}
5890
5891
memberDebugInfo.push_back(debugInfo);
5892
}
5893
}
5894
}
5895
5896
// Make the SPIR-V type
5897
spv::Id spvType = builder.makeStructType(spvMembers, memberDebugInfo, type.getTypeName().c_str(), false);
5898
if (! HasNonLayoutQualifiers(type, qualifier))
5899
structMap[explicitLayout][qualifier.layoutMatrix][glslangMembers] = spvType;
5900
5901
// Decorate it
5902
decorateStructType(type, glslangMembers, explicitLayout, qualifier, spvType, spvMembers);
5903
5904
for (int i = 0; i < (int)deferredForwardPointers.size(); ++i) {
5905
auto it = deferredForwardPointers[i];
5906
convertGlslangToSpvType(*it.first, explicitLayout, it.second, false);
5907
}
5908
5909
return spvType;
5910
}
5911
5912
// Name and decorate the members of an already-created SPIR-V struct type,
// then decorate the struct type itself.
//
//   type           - the glslang struct/block type that 'spvType' was made from
//   glslangMembers - the glslang member list of 'type'
//   explicitLayout - packing rule; anything other than ElpNone causes Offset and
//                    MatrixStride decorations to be emitted
//   qualifier      - qualifier each member inherits from (via InheritQualifiers)
//   spvType        - Id of the SPIR-V struct being decorated
//   spvMembers     - Ids of the SPIR-V member types, in SPIR-V member order
void TGlslangToSpvTraverser::decorateStructType(const glslang::TType& type,
                                                const glslang::TTypeList* glslangMembers,
                                                glslang::TLayoutPacking explicitLayout,
                                                const glslang::TQualifier& qualifier,
                                                spv::Id spvType,
                                                const std::vector<spv::Id>& spvMembers)
{
    // Name and decorate the non-hidden members
    int offset = -1;
    const bool memberLocationInvalid =
        type.isArrayOfArrays() ||
        (type.isArray() && (type.getQualifier().isArrayedIo(glslangIntermediate->getStage()) == false));

    for (int i = 0; i < (int)glslangMembers->size(); i++) {
        glslang::TType& glslangMember = *(*glslangMembers)[i].type;

        // For blocks, the SPIR-V member index comes from the remapper.
        int member = i;
        if (type.getBasicType() == glslang::EbtBlock) {
            member = memberRemapper[glslangTypeToIdMap[glslangMembers]][i];
            if (filterMember(glslangMember))
                continue;
        }

        // modify just this child's view of the qualifier
        glslang::TQualifier memberQualifier = glslangMember.getQualifier();
        InheritQualifiers(memberQualifier, qualifier);

        // using -1 above to indicate a hidden member
        if (member < 0)
            continue;

        // The member's own (non-inherited) qualifier, used for several decorations below.
        const glslang::TQualifier& declaredQualifier = glslangMember.getQualifier();

        builder.addMemberName(spvType, member, glslangMember.getFieldName().c_str());
        builder.addMemberDecoration(spvType, member,
                                    TranslateLayoutDecoration(glslangMember, memberQualifier.layoutMatrix));
        builder.addMemberDecoration(spvType, member, TranslatePrecisionDecoration(glslangMember));

        // Add interpolation and auxiliary storage decorations only to
        // top-level members of Input and Output storage classes
        const bool isVarying = type.getQualifier().storage == glslang::EvqVaryingIn ||
                               type.getQualifier().storage == glslang::EvqVaryingOut;
        if (isVarying) {
            if (type.getBasicType() == glslang::EbtBlock ||
                glslangIntermediate->getSource() == glslang::EShSourceHlsl) {
                builder.addMemberDecoration(spvType, member, TranslateInterpolationDecoration(memberQualifier));
                builder.addMemberDecoration(spvType, member, TranslateAuxiliaryStorageDecoration(memberQualifier));
                addMeshNVDecoration(spvType, member, memberQualifier);
            }
        }
        builder.addMemberDecoration(spvType, member, TranslateInvariantDecoration(memberQualifier));

        if (type.getBasicType() == glslang::EbtBlock && qualifier.storage == glslang::EvqBuffer) {
            // Add memory decorations only to top-level members of shader storage block
            std::vector<spv::Decoration> memory;
            TranslateMemoryDecoration(memberQualifier, memory, glslangIntermediate->usingVulkanMemoryModel());
            for (spv::Decoration memoryDecoration : memory)
                builder.addMemberDecoration(spvType, member, memoryDecoration);
        }

        // Location assignment was already completed correctly by the front end,
        // just track whether a member needs to be decorated.
        // Ignore member locations if the container is an array, as that's
        // ill-specified and decisions have been made to not allow this.
        if (!memberLocationInvalid && memberQualifier.hasLocation())
            builder.addMemberDecoration(spvType, member, spv::Decoration::Location, memberQualifier.layoutLocation);

        // component, XFB, others
        if (declaredQualifier.hasComponent())
            builder.addMemberDecoration(spvType, member, spv::Decoration::Component,
                                        declaredQualifier.layoutComponent);
        if (declaredQualifier.hasXfbOffset()) {
            builder.addMemberDecoration(spvType, member, spv::Decoration::Offset,
                                        declaredQualifier.layoutXfbOffset);
        } else if (explicitLayout != glslang::ElpNone) {
            // figure out what to do with offset, which is accumulating
            int nextOffset;
            updateMemberOffset(type, glslangMember, offset, nextOffset, explicitLayout, memberQualifier.layoutMatrix);
            if (offset >= 0)
                builder.addMemberDecoration(spvType, member, spv::Decoration::Offset, offset);
            offset = nextOffset;
        }

        if (glslangMember.isMatrix() && explicitLayout != glslang::ElpNone)
            builder.addMemberDecoration(spvType, member, spv::Decoration::MatrixStride,
                                        getMatrixStride(glslangMember, explicitLayout, memberQualifier.layoutMatrix));

        // built-in variable decorations
        const spv::BuiltIn builtIn = TranslateBuiltInDecoration(declaredQualifier.builtIn, true);
        if (builtIn != spv::BuiltIn::Max)
            builder.addMemberDecoration(spvType, member, spv::Decoration::BuiltIn, (int)builtIn);

        // nonuniform
        builder.addMemberDecoration(spvType, member, TranslateNonUniformDecoration(declaredQualifier));

        if (glslangIntermediate->getHlslFunctionality1() && memberQualifier.semanticName != nullptr) {
            builder.addExtension("SPV_GOOGLE_hlsl_functionality1");
            builder.addMemberDecoration(spvType, member, spv::Decoration::HlslSemanticGOOGLE,
                                        memberQualifier.semanticName);
        }

        if (builtIn == spv::BuiltIn::Layer) {
            // SPV_NV_viewport_array2 extension
            if (declaredQualifier.layoutViewportRelative) {
                builder.addMemberDecoration(spvType, member, spv::Decoration::ViewportRelativeNV);
                builder.addCapability(spv::Capability::ShaderViewportMaskNV);
                builder.addExtension(spv::E_SPV_NV_viewport_array2);
            }
            // Any value other than -2048 causes the secondary-viewport decoration to be emitted.
            if (declaredQualifier.layoutSecondaryViewportRelativeOffset != -2048) {
                builder.addMemberDecoration(spvType, member,
                                            spv::Decoration::SecondaryViewportRelativeNV,
                                            declaredQualifier.layoutSecondaryViewportRelativeOffset);
                builder.addCapability(spv::Capability::ShaderStereoViewNV);
                builder.addExtension(spv::E_SPV_NV_stereo_view_rendering);
            }
        }
        if (declaredQualifier.layoutPassthrough) {
            builder.addMemberDecoration(spvType, member, spv::Decoration::PassthroughNV);
            builder.addCapability(spv::Capability::GeometryShaderPassthroughNV);
            builder.addExtension(spv::E_SPV_NV_geometry_shader_passthrough);
        }

        // Add SPIR-V decorations (GL_EXT_spirv_intrinsics)
        if (declaredQualifier.hasSpirvDecorate())
            applySpirvDecorate(glslangMember, spvType, member);
    }

    // Decorate the structure
    builder.addDecoration(spvType, TranslateLayoutDecoration(type, qualifier.layoutMatrix));
    const auto basicType = type.getBasicType();
    const auto typeStorageQualifier = type.getQualifier().storage;
    if (basicType == glslang::EbtBlock) {
        builder.addDecoration(spvType,
                              TranslateBlockDecoration(typeStorageQualifier, glslangIntermediate->usingStorageBuffer()));
    } else if (basicType == glslang::EbtStruct && glslangIntermediate->getSpv().vulkan > 0) {
        // A plain struct whose last member is a runtime array also gets the block decoration.
        const bool endsInRuntimeArray =
            !spvMembers.empty() && builder.getOpCode(spvMembers.back()) == spv::Op::OpTypeRuntimeArray;
        if (endsInRuntimeArray) {
            builder.addDecoration(spvType,
                                  TranslateBlockDecoration(typeStorageQualifier, glslangIntermediate->usingStorageBuffer()));
        }
    }

    if (qualifier.hasHitObjectShaderRecordNV())
        builder.addDecoration(spvType, spv::Decoration::HitObjectShaderRecordBufferNV);
    if (qualifier.hasHitObjectShaderRecordEXT())
        builder.addDecoration(spvType, spv::Decoration::HitObjectShaderRecordBufferEXT);
}
6051
6052
// Turn the expression forming the array size into an id.
6053
// This is not quite trivial, because of specialization constants.
6054
// Sometimes, a raw constant is turned into an Id, and sometimes
6055
// a specialization constant expression is.
6056
spv::Id TGlslangToSpvTraverser::makeArraySizeId(const glslang::TArraySizes& arraySizes, int dim, bool allowZero, bool boolType)
6057
{
6058
// First, see if this is sized with a node, meaning a specialization constant:
6059
glslang::TIntermTyped* specNode = arraySizes.getDimNode(dim);
6060
if (specNode != nullptr) {
6061
builder.clearAccessChain();
6062
SpecConstantOpModeGuard spec_constant_op_mode_setter(&builder);
6063
spec_constant_op_mode_setter.turnOnSpecConstantOpMode();
6064
specNode->traverse(this);
6065
return accessChainLoad(specNode->getAsTyped()->getType());
6066
}
6067
6068
// Otherwise, need a compile-time (front end) size, get it:
6069
int size = arraySizes.getDimSize(dim);
6070
6071
if (!allowZero)
6072
assert(size > 0);
6073
6074
if (boolType) {
6075
return builder.makeBoolConstant(size);
6076
} else {
6077
return builder.makeUintConstant(size);
6078
}
6079
}
6080
6081
// Wrap the builder's accessChainLoad to:
6082
// - localize handling of RelaxedPrecision
6083
// - use the SPIR-V inferred type instead of another conversion of the glslang type
6084
// (avoids unnecessary work and possible type punning for structures)
6085
// - do conversion of concrete to abstract type
6086
spv::Id TGlslangToSpvTraverser::accessChainLoad(const glslang::TType& type)
6087
{
6088
spv::Id nominalTypeId = builder.accessChainGetInferredType();
6089
6090
spv::Builder::AccessChain::CoherentFlags coherentFlags = builder.getAccessChain().coherentFlags;
6091
coherentFlags |= TranslateCoherent(type);
6092
6093
spv::MemoryAccessMask accessMask = spv::MemoryAccessMask(TranslateMemoryAccess(coherentFlags) & ~spv::MemoryAccessMask::MakePointerAvailableKHR);
6094
// If the value being loaded is HelperInvocation, SPIR-V 1.6 is being generated (so that
6095
// SPV_EXT_demote_to_helper_invocation is in core) and the memory model is in use, add
6096
// the Volatile MemoryAccess semantic.
6097
if (type.getQualifier().builtIn == glslang::EbvHelperInvocation &&
6098
glslangIntermediate->usingVulkanMemoryModel() &&
6099
glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6) {
6100
accessMask = spv::MemoryAccessMask(accessMask | spv::MemoryAccessMask::Volatile);
6101
}
6102
6103
unsigned int alignment = builder.getAccessChain().alignment;
6104
alignment |= type.getBufferReferenceAlignment();
6105
6106
spv::Id loadedId = builder.accessChainLoad(TranslatePrecisionDecoration(type),
6107
TranslateNonUniformDecoration(builder.getAccessChain().coherentFlags),
6108
TranslateNonUniformDecoration(type.getQualifier()),
6109
nominalTypeId,
6110
accessMask,
6111
TranslateMemoryScope(coherentFlags),
6112
alignment);
6113
6114
// Need to convert to abstract types when necessary
6115
if (type.getBasicType() == glslang::EbtBool) {
6116
loadedId = convertLoadedBoolInUniformToUint(type, nominalTypeId, loadedId);
6117
}
6118
6119
return loadedId;
6120
}
6121
6122
// Wrap the builder's accessChainStore to:
6123
// - do conversion of concrete to abstract type
6124
//
6125
// Implicitly uses the existing builder.accessChain as the storage target.
6126
void TGlslangToSpvTraverser::accessChainStore(const glslang::TType& type, spv::Id rvalue)
6127
{
6128
// Need to convert to abstract types when necessary
6129
if (type.getBasicType() == glslang::EbtBool) {
6130
spv::Id nominalTypeId = builder.accessChainGetInferredType();
6131
6132
if (builder.isScalarType(nominalTypeId)) {
6133
// Conversion for bool
6134
spv::Id boolType = builder.makeBoolType();
6135
if (nominalTypeId != boolType) {
6136
// keep these outside arguments, for determinant order-of-evaluation
6137
spv::Id one = builder.makeUintConstant(1);
6138
spv::Id zero = builder.makeUintConstant(0);
6139
rvalue = builder.createTriOp(spv::Op::OpSelect, nominalTypeId, rvalue, one, zero);
6140
} else if (builder.getTypeId(rvalue) != boolType)
6141
rvalue = builder.createBinOp(spv::Op::OpINotEqual, boolType, rvalue, builder.makeUintConstant(0));
6142
} else if (builder.isVectorType(nominalTypeId)) {
6143
// Conversion for bvec
6144
int vecSize = builder.getNumTypeComponents(nominalTypeId);
6145
spv::Id bvecType = builder.makeVectorType(builder.makeBoolType(), vecSize);
6146
if (nominalTypeId != bvecType) {
6147
// keep these outside arguments, for determinant order-of-evaluation
6148
spv::Id one = makeSmearedConstant(builder.makeUintConstant(1), vecSize);
6149
spv::Id zero = makeSmearedConstant(builder.makeUintConstant(0), vecSize);
6150
rvalue = builder.createTriOp(spv::Op::OpSelect, nominalTypeId, rvalue, one, zero);
6151
} else if (builder.getTypeId(rvalue) != bvecType)
6152
rvalue = builder.createBinOp(spv::Op::OpINotEqual, bvecType, rvalue,
6153
makeSmearedConstant(builder.makeUintConstant(0), vecSize));
6154
}
6155
}
6156
6157
spv::Builder::AccessChain::CoherentFlags coherentFlags = builder.getAccessChain().coherentFlags;
6158
coherentFlags |= TranslateCoherent(type);
6159
6160
unsigned int alignment = builder.getAccessChain().alignment;
6161
alignment |= type.getBufferReferenceAlignment();
6162
6163
builder.accessChainStore(rvalue, TranslateNonUniformDecoration(builder.getAccessChain().coherentFlags),
6164
spv::MemoryAccessMask(TranslateMemoryAccess(coherentFlags) &
6165
~spv::MemoryAccessMask::MakePointerVisibleKHR),
6166
TranslateMemoryScope(coherentFlags), alignment);
6167
}
6168
6169
// For storing when types match at the glslang level, but not might match at the
6170
// SPIR-V level.
6171
//
6172
// This especially happens when a single glslang type expands to multiple
6173
// SPIR-V types, like a struct that is used in a member-undecorated way as well
6174
// as in a member-decorated way.
6175
//
6176
// NOTE: This function can handle any store request; if it's not special it
6177
// simplifies to a simple OpStore.
6178
//
6179
// Implicitly uses the existing builder.accessChain as the storage target.
6180
void TGlslangToSpvTraverser::multiTypeStore(const glslang::TType& type, spv::Id rValue)
6181
{
6182
// we only do the complex path here if it's an aggregate
6183
if (! type.isStruct() && ! type.isArray()) {
6184
accessChainStore(type, rValue);
6185
return;
6186
}
6187
6188
// and, it has to be a case of type aliasing
6189
spv::Id rType = builder.getTypeId(rValue);
6190
spv::Id lValue = builder.accessChainGetLValue();
6191
spv::Id lType = builder.getContainedTypeId(builder.getTypeId(lValue));
6192
if (lType == rType) {
6193
accessChainStore(type, rValue);
6194
return;
6195
}
6196
6197
// Recursively (as needed) copy an aggregate type to a different aggregate type,
6198
// where the two types were the same type in GLSL. This requires member
6199
// by member copy, recursively.
6200
6201
// SPIR-V 1.4 added an instruction to do help do this.
6202
if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4) {
6203
// However, bool in uniform space is changed to int, so
6204
// OpCopyLogical does not work for that.
6205
// TODO: It would be more robust to do a full recursive verification of the types satisfying SPIR-V rules.
6206
bool rBool = builder.containsType(builder.getTypeId(rValue), spv::Op::OpTypeBool, 0);
6207
bool lBool = builder.containsType(lType, spv::Op::OpTypeBool, 0);
6208
if (lBool == rBool) {
6209
spv::Id logicalCopy = builder.createUnaryOp(spv::Op::OpCopyLogical, lType, rValue);
6210
accessChainStore(type, logicalCopy);
6211
return;
6212
}
6213
}
6214
6215
// If an array, copy element by element.
6216
if (type.isArray()) {
6217
glslang::TType glslangElementType(type, 0);
6218
spv::Id elementRType = builder.getContainedTypeId(rType);
6219
for (int index = 0; index < type.getOuterArraySize(); ++index) {
6220
// get the source member
6221
spv::Id elementRValue = builder.createCompositeExtract(rValue, elementRType, index);
6222
6223
// set up the target storage
6224
builder.clearAccessChain();
6225
builder.setAccessChainLValue(lValue);
6226
builder.accessChainPush(builder.makeIntConstant(index), TranslateCoherent(type),
6227
type.getBufferReferenceAlignment());
6228
6229
// store the member
6230
multiTypeStore(glslangElementType, elementRValue);
6231
}
6232
} else {
6233
assert(type.isStruct());
6234
6235
// loop over structure members
6236
const glslang::TTypeList& members = *type.getStruct();
6237
for (int m = 0; m < (int)members.size(); ++m) {
6238
const glslang::TType& glslangMemberType = *members[m].type;
6239
6240
// get the source member
6241
spv::Id memberRType = builder.getContainedTypeId(rType, m);
6242
spv::Id memberRValue = builder.createCompositeExtract(rValue, memberRType, m);
6243
6244
// set up the target storage
6245
builder.clearAccessChain();
6246
builder.setAccessChainLValue(lValue);
6247
builder.accessChainPush(builder.makeIntConstant(m), TranslateCoherent(type),
6248
type.getBufferReferenceAlignment());
6249
6250
// store the member
6251
multiTypeStore(glslangMemberType, memberRValue);
6252
}
6253
}
6254
}
6255
6256
// Decide whether or not this type should be
6257
// decorated with offsets and strides, and if so
6258
// whether std140 or std430 rules should be applied.
6259
glslang::TLayoutPacking TGlslangToSpvTraverser::getExplicitLayout(const glslang::TType& type) const
6260
{
6261
// has to be a block
6262
if (type.getBasicType() != glslang::EbtBlock)
6263
return glslang::ElpNone;
6264
6265
// has to be a uniform or buffer block or task in/out blocks
6266
if (type.getQualifier().storage != glslang::EvqUniform &&
6267
type.getQualifier().storage != glslang::EvqBuffer &&
6268
type.getQualifier().storage != glslang::EvqShared &&
6269
!type.getQualifier().isTaskMemory())
6270
return glslang::ElpNone;
6271
6272
// return the layout to use
6273
switch (type.getQualifier().layoutPacking) {
6274
case glslang::ElpStd140:
6275
case glslang::ElpStd430:
6276
case glslang::ElpScalar:
6277
return type.getQualifier().layoutPacking;
6278
default:
6279
return glslang::ElpNone;
6280
}
6281
}
6282
6283
// Given an array type, returns the integer stride required for that array
6284
int TGlslangToSpvTraverser::getArrayStride(const glslang::TType& arrayType, glslang::TLayoutPacking explicitLayout,
6285
glslang::TLayoutMatrix matrixLayout)
6286
{
6287
int size;
6288
int stride;
6289
glslangIntermediate->getMemberAlignment(arrayType, size, stride, explicitLayout,
6290
matrixLayout == glslang::ElmRowMajor);
6291
6292
return stride;
6293
}
6294
6295
// Given a matrix type, or array (of array) of matrixes type, returns the integer stride required for that matrix
6296
// when used as a member of an interface block
6297
int TGlslangToSpvTraverser::getMatrixStride(const glslang::TType& matrixType, glslang::TLayoutPacking explicitLayout,
6298
glslang::TLayoutMatrix matrixLayout)
6299
{
6300
glslang::TType elementType;
6301
elementType.shallowCopy(matrixType);
6302
elementType.clearArraySizes();
6303
6304
int size;
6305
int stride;
6306
glslangIntermediate->getMemberAlignment(elementType, size, stride, explicitLayout,
6307
matrixLayout == glslang::ElmRowMajor);
6308
6309
return stride;
6310
}
6311
6312
// Given a member type of a struct, realign the current offset for it, and compute
6313
// the next (not yet aligned) offset for the next member, which will get aligned
6314
// on the next call.
6315
// 'currentOffset' should be passed in already initialized, ready to modify, and reflecting
6316
// the migration of data from nextOffset -> currentOffset. It should be -1 on the first call.
6317
// -1 means a non-forced member offset (no decoration needed).
6318
void TGlslangToSpvTraverser::updateMemberOffset(const glslang::TType& structType, const glslang::TType& memberType,
6319
int& currentOffset, int& nextOffset, glslang::TLayoutPacking explicitLayout, glslang::TLayoutMatrix matrixLayout)
6320
{
6321
// this will get a positive value when deemed necessary
6322
nextOffset = -1;
6323
6324
// override anything in currentOffset with user-set offset
6325
if (memberType.getQualifier().hasOffset())
6326
currentOffset = memberType.getQualifier().layoutOffset;
6327
6328
// It could be that current linker usage in glslang updated all the layoutOffset,
6329
// in which case the following code does not matter. But, that's not quite right
6330
// once cross-compilation unit GLSL validation is done, as the original user
6331
// settings are needed in layoutOffset, and then the following will come into play.
6332
6333
if (explicitLayout == glslang::ElpNone) {
6334
if (! memberType.getQualifier().hasOffset())
6335
currentOffset = -1;
6336
6337
return;
6338
}
6339
6340
// Getting this far means we need explicit offsets
6341
if (currentOffset < 0)
6342
currentOffset = 0;
6343
6344
// Now, currentOffset is valid (either 0, or from a previous nextOffset),
6345
// but possibly not yet correctly aligned.
6346
6347
int memberSize;
6348
int dummyStride;
6349
int memberAlignment = glslangIntermediate->getMemberAlignment(memberType, memberSize, dummyStride, explicitLayout,
6350
matrixLayout == glslang::ElmRowMajor);
6351
6352
bool isVectorLike = memberType.isVector();
6353
if (memberType.isMatrix()) {
6354
if (matrixLayout == glslang::ElmRowMajor)
6355
isVectorLike = memberType.getMatrixRows() == 1;
6356
else
6357
isVectorLike = memberType.getMatrixCols() == 1;
6358
}
6359
6360
// Adjust alignment for HLSL rules
6361
// TODO: make this consistent in early phases of code:
6362
// adjusting this late means inconsistencies with earlier code, which for reflection is an issue
6363
// Until reflection is brought in sync with these adjustments, don't apply to $Global,
6364
// which is the most likely to rely on reflection, and least likely to rely implicit layouts
6365
if (glslangIntermediate->usingHlslOffsets() &&
6366
! memberType.isStruct() && structType.getTypeName().compare("$Global") != 0) {
6367
int componentSize;
6368
int componentAlignment = glslangIntermediate->getBaseAlignmentScalar(memberType, componentSize);
6369
if (! memberType.isArray() && isVectorLike && componentAlignment <= 4)
6370
memberAlignment = componentAlignment;
6371
6372
// Don't add unnecessary padding after this member
6373
// (undo std140 bumping size to a mutliple of vec4)
6374
if (explicitLayout == glslang::ElpStd140) {
6375
if (memberType.isMatrix()) {
6376
if (matrixLayout == glslang::ElmRowMajor)
6377
memberSize -= componentSize * (4 - memberType.getMatrixCols());
6378
else
6379
memberSize -= componentSize * (4 - memberType.getMatrixRows());
6380
} else if (memberType.isArray())
6381
memberSize -= componentSize * (4 - memberType.getVectorSize());
6382
}
6383
}
6384
6385
// Bump up to member alignment
6386
glslang::RoundToPow2(currentOffset, memberAlignment);
6387
6388
// Bump up to vec4 if there is a bad straddle
6389
if (explicitLayout != glslang::ElpScalar && glslangIntermediate->improperStraddle(memberType, memberSize,
6390
currentOffset, isVectorLike))
6391
glslang::RoundToPow2(currentOffset, 16);
6392
6393
nextOffset = currentOffset + memberSize;
6394
}
6395
6396
// Called when member 'glslangMember' of 'members' is used. For the built-ins
// listed below, TranslateBuiltInDecoration() is invoked (result ignored) so the
// associated capability gets generated; all other members need nothing here.
void TGlslangToSpvTraverser::declareUseOfStructMember(const glslang::TTypeList& members, int glslangMember)
{
    const glslang::TBuiltInVariable usedBuiltIn = members[glslangMember].type->getQualifier().builtIn;

    switch (usedBuiltIn) {
    case glslang::EbvPointSize:
    case glslang::EbvClipDistance:
    case glslang::EbvCullDistance:
    case glslang::EbvViewportMaskNV:
    case glslang::EbvSecondaryPositionNV:
    case glslang::EbvSecondaryViewportMaskNV:
    case glslang::EbvPositionPerViewNV:
    case glslang::EbvViewportMaskPerViewNV:
    case glslang::EbvTaskCountNV:
    case glslang::EbvPrimitiveCountNV:
    case glslang::EbvPrimitiveIndicesNV:
    case glslang::EbvClipDistancePerViewNV:
    case glslang::EbvCullDistancePerViewNV:
    case glslang::EbvLayerPerViewNV:
    case glslang::EbvMeshViewCountNV:
    case glslang::EbvMeshViewIndicesNV:
        // Generate the associated capability. Delegate to TranslateBuiltInDecoration.
        // Alternately, we could just call this for any glslang built-in, since the
        // capability already guards against duplicates.
        TranslateBuiltInDecoration(usedBuiltIn, false);
        break;

    default:
        // Capabilities were already generated when the struct was declared.
        break;
    }
}
6427
6428
// Returns true when the name of 'node' equals the intermediate's mangled entry-point name.
bool TGlslangToSpvTraverser::isShaderEntryPoint(const glslang::TIntermAggregate* node)
{
    const int difference = node->getName().compare(glslangIntermediate->getEntryPointMangledName().c_str());
    return difference == 0;
}
6432
6433
// Does parameter need a place to keep writes, separate from the original?
6434
// Assumes called after originalParam(), which filters out block/buffer/opaque-based
6435
// qualifiers such that we should have only in/out/inout/constreadonly here.
6436
bool TGlslangToSpvTraverser::writableParam(glslang::TStorageQualifier qualifier) const
6437
{
6438
assert(qualifier == glslang::EvqIn ||
6439
qualifier == glslang::EvqOut ||
6440
qualifier == glslang::EvqInOut ||
6441
qualifier == glslang::EvqUniform ||
6442
qualifier == glslang::EvqConstReadOnly);
6443
return qualifier != glslang::EvqConstReadOnly &&
6444
qualifier != glslang::EvqUniform;
6445
}
6446
6447
// Is parameter pass-by-original?
6448
bool TGlslangToSpvTraverser::originalParam(glslang::TStorageQualifier qualifier, const glslang::TType& paramType,
6449
bool implicitThisParam)
6450
{
6451
if (implicitThisParam) // implicit this
6452
return true;
6453
if (glslangIntermediate->getSource() == glslang::EShSourceHlsl)
6454
return paramType.getBasicType() == glslang::EbtBlock;
6455
return (paramType.containsOpaque() && !glslangIntermediate->getBindlessMode()) || // sampler, etc.
6456
paramType.getQualifier().isSpirvByReference() || // spirv_by_reference
6457
(paramType.getBasicType() == glslang::EbtBlock && qualifier == glslang::EvqBuffer); // SSBO
6458
}
6459
6460
// Make all the functions, skeletally, without actually visiting their bodies.
6461
void TGlslangToSpvTraverser::makeFunctions(const glslang::TIntermSequence& glslFunctions)
6462
{
6463
const auto getParamDecorations = [&](std::vector<spv::Decoration>& decorations, const glslang::TType& type,
6464
bool useVulkanMemoryModel) {
6465
spv::Decoration paramPrecision = TranslatePrecisionDecoration(type);
6466
if (paramPrecision != spv::NoPrecision)
6467
decorations.push_back(paramPrecision);
6468
TranslateMemoryDecoration(type.getQualifier(), decorations, useVulkanMemoryModel);
6469
if (type.isReference()) {
6470
// Original and non-writable params pass the pointer directly and
6471
// use restrict/aliased, others are stored to a pointer in Function
6472
// memory and use RestrictPointer/AliasedPointer.
6473
if (originalParam(type.getQualifier().storage, type, false) ||
6474
!writableParam(type.getQualifier().storage)) {
6475
// TranslateMemoryDecoration added Restrict decoration already.
6476
if (!type.getQualifier().isRestrict()) {
6477
decorations.push_back(spv::Decoration::Aliased);
6478
}
6479
} else {
6480
decorations.push_back(type.getQualifier().isRestrict() ? spv::Decoration::RestrictPointerEXT :
6481
spv::Decoration::AliasedPointerEXT);
6482
}
6483
}
6484
};
6485
6486
for (int f = 0; f < (int)glslFunctions.size(); ++f) {
6487
glslang::TIntermAggregate* glslFunction = glslFunctions[f]->getAsAggregate();
6488
if (! glslFunction || glslFunction->getOp() != glslang::EOpFunction)
6489
continue;
6490
6491
builder.setDebugSourceLocation(glslFunction->getLoc().line, glslFunction->getLoc().getFilename());
6492
6493
if (isShaderEntryPoint(glslFunction)) {
6494
// For HLSL, the entry function is actually a compiler generated function to resolve the difference of
6495
// entry function signature between HLSL and SPIR-V. So we don't emit debug information for that.
6496
if (glslangIntermediate->getSource() != glslang::EShSourceHlsl) {
6497
builder.setupFunctionDebugInfo(shaderEntry, glslangIntermediate->getEntryPointMangledName().c_str(),
6498
std::vector<spv::Id>(), // main function has no param
6499
std::vector<char const*>());
6500
}
6501
continue;
6502
}
6503
// We're on a user function. Set up the basic interface for the function now,
6504
// so that it's available to call. Translating the body will happen later.
6505
//
6506
// Typically (except for a "const in" parameter), an address will be passed to the
6507
// function. What it is an address of varies:
6508
//
6509
// - "in" parameters not marked as "const" can be written to without modifying the calling
6510
// argument so that write needs to be to a copy, hence the address of a copy works.
6511
//
6512
// - "const in" parameters can just be the r-value, as no writes need occur.
6513
//
6514
// - "out" and "inout" arguments can't be done as pointers to the calling argument, because
6515
// GLSL has copy-in/copy-out semantics. They can be handled though with a pointer to a copy.
6516
6517
std::vector<spv::Id> paramTypes;
6518
std::vector<char const*> paramNames;
6519
std::vector<std::vector<spv::Decoration>> paramDecorations; // list of decorations per parameter
6520
glslang::TIntermSequence& parameters = glslFunction->getSequence()[0]->getAsAggregate()->getSequence();
6521
6522
#ifdef ENABLE_HLSL
6523
bool implicitThis = (int)parameters.size() > 0 && parameters[0]->getAsSymbolNode()->getName() ==
6524
glslangIntermediate->implicitThisName;
6525
#else
6526
bool implicitThis = false;
6527
#endif
6528
6529
paramDecorations.resize(parameters.size());
6530
for (int p = 0; p < (int)parameters.size(); ++p) {
6531
const glslang::TType& paramType = parameters[p]->getAsTyped()->getType();
6532
spv::Id typeId = convertGlslangToSpvType(paramType);
6533
if (originalParam(paramType.getQualifier().storage, paramType, implicitThis && p == 0))
6534
typeId = builder.makePointer(TranslateStorageClass(paramType), typeId);
6535
else if (writableParam(paramType.getQualifier().storage))
6536
typeId = builder.makePointer(spv::StorageClass::Function, typeId);
6537
else
6538
rValueParameters.insert(parameters[p]->getAsSymbolNode()->getId());
6539
getParamDecorations(paramDecorations[p], paramType, glslangIntermediate->usingVulkanMemoryModel());
6540
paramTypes.push_back(typeId);
6541
}
6542
6543
for (auto const parameter:parameters) {
6544
paramNames.push_back(parameter->getAsSymbolNode()->getName().c_str());
6545
}
6546
6547
spv::Block* functionBlock;
6548
spv::Function* function = builder.makeFunctionEntry(
6549
TranslatePrecisionDecoration(glslFunction->getType()), convertGlslangToSpvType(glslFunction->getType()),
6550
glslFunction->getName().c_str(), convertGlslangLinkageToSpv(glslFunction->getLinkType()), paramTypes,
6551
paramDecorations, &functionBlock);
6552
builder.setupFunctionDebugInfo(function, glslFunction->getName().c_str(), paramTypes, paramNames);
6553
if (implicitThis)
6554
function->setImplicitThis();
6555
6556
// Track function to emit/call later
6557
functionMap[glslFunction->getName().c_str()] = function;
6558
6559
// Set the parameter id's
6560
for (int p = 0; p < (int)parameters.size(); ++p) {
6561
symbolValues[parameters[p]->getAsSymbolNode()->getId()] = function->getParamId(p);
6562
// give a name too
6563
builder.addName(function->getParamId(p), parameters[p]->getAsSymbolNode()->getName().c_str());
6564
6565
const glslang::TType& paramType = parameters[p]->getAsTyped()->getType();
6566
if (paramType.contains8BitInt())
6567
builder.addCapability(spv::Capability::Int8);
6568
if (paramType.contains16BitInt())
6569
builder.addCapability(spv::Capability::Int16);
6570
if (paramType.contains16BitFloat())
6571
builder.addCapability(spv::Capability::Float16);
6572
}
6573
}
6574
}
6575
6576
// Process all the initializers, while skipping the functions and link objects
6577
void TGlslangToSpvTraverser::makeGlobalInitializers(const glslang::TIntermSequence& initializers)
6578
{
6579
builder.setBuildPoint(shaderEntry->getLastBlock());
6580
for (int i = 0; i < (int)initializers.size(); ++i) {
6581
glslang::TIntermAggregate* initializer = initializers[i]->getAsAggregate();
6582
if (initializer && initializer->getOp() != glslang::EOpFunction && initializer->getOp() !=
6583
glslang::EOpLinkerObjects) {
6584
6585
// We're on a top-level node that's not a function. Treat as an initializer, whose
6586
// code goes into the beginning of the entry point.
6587
initializer->traverse(this);
6588
}
6589
}
6590
}
6591
// Walk over all linker objects to create a map for payload and callable data linker objects
6592
// and their location to be used during codegen for OpTraceKHR and OpExecuteCallableKHR
6593
// This is done here since it is possible that these linker objects are not be referenced in the AST
6594
void TGlslangToSpvTraverser::collectRayTracingLinkerObjects()
6595
{
6596
glslang::TIntermAggregate* linkerObjects = glslangIntermediate->findLinkerObjects();
6597
for (auto& objSeq : linkerObjects->getSequence()) {
6598
auto objNode = objSeq->getAsSymbolNode();
6599
if (objNode != nullptr) {
6600
if (objNode->getQualifier().hasLocation()) {
6601
unsigned int location = objNode->getQualifier().layoutLocation;
6602
auto st = objNode->getQualifier().storage;
6603
int set;
6604
switch (st)
6605
{
6606
case glslang::EvqPayload:
6607
case glslang::EvqPayloadIn:
6608
set = 0;
6609
break;
6610
case glslang::EvqCallableData:
6611
case glslang::EvqCallableDataIn:
6612
set = 1;
6613
break;
6614
6615
case glslang::EvqHitObjectAttrNV:
6616
case glslang::EvqHitObjectAttrEXT:
6617
set = 2;
6618
break;
6619
6620
default:
6621
set = -1;
6622
}
6623
if (set != -1)
6624
locationToSymbol[set].insert(std::make_pair(location, objNode));
6625
}
6626
}
6627
}
6628
}
6629
// Process all the functions, while skipping initializers.
6630
void TGlslangToSpvTraverser::visitFunctions(const glslang::TIntermSequence& glslFunctions)
6631
{
6632
for (int f = 0; f < (int)glslFunctions.size(); ++f) {
6633
glslang::TIntermAggregate* node = glslFunctions[f]->getAsAggregate();
6634
if (node && (node->getOp() == glslang::EOpFunction || node->getOp() == glslang::EOpLinkerObjects))
6635
node->traverse(this);
6636
}
6637
}
6638
6639
// Translate each operand of the aggregate 'node' and append one id per operand to
// 'arguments'.
//
// For most operands the appended id is the loaded value. For the one operand that a
// given operation needs as an l-value (see the table below), the appended id is the
// access chain's l-value instead, and 'lvalueCoherentFlags' is set from that access
// chain's coherent flags combined with the coherency of the operand's type.
void TGlslangToSpvTraverser::translateArguments(const glslang::TIntermAggregate& node, std::vector<spv::Id>& arguments,
    spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags)
{
    const glslang::TIntermSequence& glslangArguments = node.getSequence();

    // Sampler properties only matter (and are only read) for texture/image operations.
    glslang::TSampler sampler = {};
    bool cubeCompare = false;
    bool f16ShadowCompare = false;
    if (node.isTexture() || node.isImage()) {
        sampler = glslangArguments[0]->getAsTyped()->getType().getSampler();
        cubeCompare = sampler.dim == glslang::EsdCube && sampler.arrayed && sampler.shadow;
        f16ShadowCompare = sampler.shadow &&
            glslangArguments[1]->getAsTyped()->getType().getBasicType() == glslang::EbtFloat16;
    }

    const bool cubeOrF16Compare = cubeCompare || f16ShadowCompare;
    const bool rectSampler = sampler.dim == glslang::EsdRect;

    // Index of the operand that must be passed as an l-value for this operation,
    // or noLValueOperand when every operand is a plain value.
    const int noLValueOperand = -1;
    const auto findLValueOperand = [&]() -> int {
        switch (node.getOp()) {
        case glslang::EOpImageAtomicAdd:
        case glslang::EOpImageAtomicMin:
        case glslang::EOpImageAtomicMax:
        case glslang::EOpImageAtomicAnd:
        case glslang::EOpImageAtomicOr:
        case glslang::EOpImageAtomicXor:
        case glslang::EOpImageAtomicExchange:
        case glslang::EOpImageAtomicCompSwap:
        case glslang::EOpImageAtomicLoad:
        case glslang::EOpImageAtomicStore:
        case glslang::EOpConstructSaturated:
            return 0;

        case glslang::EOpSparseImageLoad:
            return sampler.ms ? 3 : 2;

        case glslang::EOpSparseTexture:
            return cubeOrF16Compare ? 3 : 2;

        case glslang::EOpSparseTextureClamp:
            return cubeOrF16Compare ? 4 : 3;

        case glslang::EOpSparseTextureLod:
        case glslang::EOpSparseTextureOffset:
            return f16ShadowCompare ? 4 : 3;

        case glslang::EOpSparseTextureFetch:
            return rectSampler ? 2 : 3;

        case glslang::EOpSparseTextureFetchOffset:
            return rectSampler ? 3 : 4;

        case glslang::EOpSparseTextureLodOffset:
        case glslang::EOpSparseTextureGrad:
        case glslang::EOpSparseTextureOffsetClamp:
            return f16ShadowCompare ? 5 : 4;

        case glslang::EOpSparseTextureGradOffset:
        case glslang::EOpSparseTextureGradClamp:
            return f16ShadowCompare ? 6 : 5;

        case glslang::EOpSparseTextureGradOffsetClamp:
            return f16ShadowCompare ? 7 : 6;

        case glslang::EOpSparseTextureGather:
            return sampler.shadow ? 3 : 2;

        case glslang::EOpSparseTextureGatherOffset:
        case glslang::EOpSparseTextureGatherOffsets:
            return sampler.shadow ? 4 : 3;

        case glslang::EOpRayQueryGetIntersectionTriangleVertexPositionsEXT:
        case glslang::EOpRayQueryGetIntersectionLSSPositionsNV:
        case glslang::EOpRayQueryGetIntersectionLSSRadiiNV:
            return 2;

        case glslang::EOpSparseTextureGatherLod:
        case glslang::EOpSparseImageLoadLod:
            return 3;

        case glslang::EOpSparseTextureGatherLodOffset:
        case glslang::EOpSparseTextureGatherLodOffsets:
        case glslang::EOpImageSampleFootprintNV:
            return 4;

        case glslang::EOpImageSampleFootprintClampNV:
        case glslang::EOpImageSampleFootprintLodNV:
            return 5;

        case glslang::EOpImageSampleFootprintGradNV:
            return 6;

        case glslang::EOpImageSampleFootprintGradClampNV:
            return 7;

        default:
            return noLValueOperand;
        }
    };
    const int lvalueOperand = findLValueOperand();

    for (int i = 0; i < static_cast<int>(glslangArguments.size()); ++i) {
        builder.clearAccessChain();
        glslangArguments[i]->traverse(this);

        if (i == lvalueOperand) {
            // Special-case l-value operand: pass the pointer and report its coherency.
            const spv::Id pointerId = builder.accessChainGetLValue();
            arguments.push_back(pointerId);
            lvalueCoherentFlags = builder.getAccessChain().coherentFlags;
            builder.addDecoration(pointerId, TranslateNonUniformDecoration(lvalueCoherentFlags));
            lvalueCoherentFlags |= TranslateCoherent(glslangArguments[i]->getAsTyped()->getType());
            continue;
        }

        // When this operand is the same symbol as the previous one, reuse the id
        // already produced for it instead of loading again.
        bool sameSymbolAsPrevious = false;
        if (i > 0) {
            auto* currentSymbol = glslangArguments[i]->getAsSymbolNode();
            auto* previousSymbol = glslangArguments[i - 1]->getAsSymbolNode();
            sameSymbolAsPrevious = currentSymbol != nullptr && previousSymbol != nullptr &&
                                   currentSymbol->getId() == previousSymbol->getId();
        }

        if (sameSymbolAsPrevious) {
            const spv::Id previousId = arguments[i - 1];
            arguments.push_back(previousId);
        } else {
            arguments.push_back(accessChainLoad(glslangArguments[i]->getAsTyped()->getType()));
        }
    }
}
6785
6786
// Unary overload: translate the single operand of 'node' and append its loaded
// value to 'arguments'.
void TGlslangToSpvTraverser::translateArguments(glslang::TIntermUnary& node, std::vector<spv::Id>& arguments)
{
    auto* const operand = node.getOperand();

    // Start from a fresh access chain, build it by visiting the operand, then load through it.
    builder.clearAccessChain();
    operand->traverse(this);

    const spv::Id loadedValue = accessChainLoad(operand->getType());
    arguments.push_back(loadedValue);
}
6792
6793
spv::Id TGlslangToSpvTraverser::createImageTextureFunctionCall(glslang::TIntermOperator* node)
6794
{
6795
if (! node->isImage() && ! node->isTexture())
6796
return spv::NoResult;
6797
6798
builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());
6799
6800
// Process a GLSL texturing op (will be SPV image)
6801
6802
const glslang::TType &imageType = node->getAsAggregate()
6803
? node->getAsAggregate()->getSequence()[0]->getAsTyped()->getType()
6804
: node->getAsUnaryNode()->getOperand()->getAsTyped()->getType();
6805
const glslang::TSampler sampler = imageType.getSampler();
6806
bool f16ShadowCompare = (sampler.shadow && node->getAsAggregate())
6807
? node->getAsAggregate()->getSequence()[1]->getAsTyped()->getType().getBasicType() == glslang::EbtFloat16
6808
: false;
6809
6810
const auto signExtensionMask = [&]() {
6811
if (builder.getSpvVersion() >= spv::Spv_1_4) {
6812
if (sampler.type == glslang::EbtUint)
6813
return spv::ImageOperandsMask::ZeroExtend;
6814
else if (sampler.type == glslang::EbtInt)
6815
return spv::ImageOperandsMask::SignExtend;
6816
}
6817
return spv::ImageOperandsMask::MaskNone;
6818
};
6819
6820
spv::Builder::AccessChain::CoherentFlags lvalueCoherentFlags;
6821
6822
std::vector<spv::Id> arguments;
6823
if (node->getAsAggregate())
6824
translateArguments(*node->getAsAggregate(), arguments, lvalueCoherentFlags);
6825
else
6826
translateArguments(*node->getAsUnaryNode(), arguments);
6827
spv::Decoration precision = TranslatePrecisionDecoration(node->getType());
6828
6829
spv::Builder::TextureParameters params = { };
6830
params.sampler = arguments[0];
6831
6832
glslang::TCrackedTextureOp cracked;
6833
node->crackTexture(sampler, cracked);
6834
6835
const bool isUnsignedResult = node->getType().getBasicType() == glslang::EbtUint;
6836
6837
if (builder.isSampledImage(params.sampler) &&
6838
((cracked.query && node->getOp() != glslang::EOpTextureQueryLod) || cracked.fragMask || cracked.fetch)) {
6839
params.sampler = builder.createUnaryOp(spv::Op::OpImage, builder.getImageType(params.sampler), params.sampler);
6840
if (imageType.getQualifier().isNonUniform()) {
6841
builder.addDecoration(params.sampler, spv::Decoration::NonUniformEXT);
6842
}
6843
}
6844
// Check for queries
6845
if (cracked.query) {
6846
switch (node->getOp()) {
6847
case glslang::EOpImageQuerySize:
6848
case glslang::EOpTextureQuerySize:
6849
if (arguments.size() > 1) {
6850
params.lod = arguments[1];
6851
return builder.createTextureQueryCall(spv::Op::OpImageQuerySizeLod, params, isUnsignedResult);
6852
} else
6853
return builder.createTextureQueryCall(spv::Op::OpImageQuerySize, params, isUnsignedResult);
6854
case glslang::EOpImageQuerySamples:
6855
case glslang::EOpTextureQuerySamples:
6856
return builder.createTextureQueryCall(spv::Op::OpImageQuerySamples, params, isUnsignedResult);
6857
case glslang::EOpTextureQueryLod:
6858
params.coords = arguments[1];
6859
return builder.createTextureQueryCall(spv::Op::OpImageQueryLod, params, isUnsignedResult);
6860
case glslang::EOpTextureQueryLevels:
6861
return builder.createTextureQueryCall(spv::Op::OpImageQueryLevels, params, isUnsignedResult);
6862
case glslang::EOpSparseTexelsResident:
6863
return builder.createUnaryOp(spv::Op::OpImageSparseTexelsResident, builder.makeBoolType(), arguments[0]);
6864
default:
6865
assert(0);
6866
break;
6867
}
6868
}
6869
6870
int components = node->getType().getVectorSize();
6871
6872
if (node->getOp() == glslang::EOpImageLoad ||
6873
node->getOp() == glslang::EOpImageLoadLod ||
6874
node->getOp() == glslang::EOpTextureFetch ||
6875
node->getOp() == glslang::EOpTextureFetchOffset) {
6876
// These must produce 4 components, per SPIR-V spec. We'll add a conversion constructor if needed.
6877
// This will only happen through the HLSL path for operator[], so we do not have to handle e.g.
6878
// the EOpTexture/Proj/Lod/etc family. It would be harmless to do so, but would need more logic
6879
// here around e.g. which ones return scalars or other types.
6880
components = 4;
6881
}
6882
6883
glslang::TType returnType(node->getType().getBasicType(), glslang::EvqTemporary, components);
6884
6885
auto resultType = [&returnType,this]{ return convertGlslangToSpvType(returnType); };
6886
6887
// Check for image functions other than queries
6888
if (node->isImage()) {
6889
std::vector<spv::IdImmediate> operands;
6890
auto opIt = arguments.begin();
6891
spv::IdImmediate image = { true, *(opIt++) };
6892
operands.push_back(image);
6893
6894
// Handle subpass operations
6895
// TODO: GLSL should change to have the "MS" only on the type rather than the
6896
// built-in function.
6897
if (cracked.subpass) {
6898
// add on the (0,0) coordinate
6899
spv::Id zero = builder.makeIntConstant(0);
6900
std::vector<spv::Id> comps;
6901
comps.push_back(zero);
6902
comps.push_back(zero);
6903
spv::IdImmediate coord = { true,
6904
builder.makeCompositeConstant(builder.makeVectorType(builder.makeIntType(32), 2), comps) };
6905
operands.push_back(coord);
6906
spv::IdImmediate imageOperands = { false, spv::ImageOperandsMask::MaskNone };
6907
imageOperands.word = imageOperands.word | (unsigned)signExtensionMask();
6908
if (sampler.isMultiSample()) {
6909
imageOperands.word = imageOperands.word | (unsigned)spv::ImageOperandsMask::Sample;
6910
}
6911
if (imageOperands.word != (unsigned)spv::ImageOperandsMask::MaskNone) {
6912
operands.push_back(imageOperands);
6913
if (sampler.isMultiSample()) {
6914
spv::IdImmediate imageOperand = { true, *(opIt++) };
6915
operands.push_back(imageOperand);
6916
}
6917
}
6918
spv::Id result = builder.createOp(spv::Op::OpImageRead, resultType(), operands);
6919
builder.setPrecision(result, precision);
6920
return result;
6921
}
6922
6923
if (cracked.attachmentEXT) {
6924
if (opIt != arguments.end()) {
6925
spv::IdImmediate sample = { true, *opIt };
6926
operands.push_back(sample);
6927
}
6928
spv::Id result = builder.createOp(spv::Op::OpColorAttachmentReadEXT, resultType(), operands);
6929
builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
6930
builder.setPrecision(result, precision);
6931
return result;
6932
}
6933
6934
spv::IdImmediate coord = { true, *(opIt++) };
6935
operands.push_back(coord);
6936
if (node->getOp() == glslang::EOpImageLoad || node->getOp() == glslang::EOpImageLoadLod) {
6937
spv::ImageOperandsMask mask = spv::ImageOperandsMask::MaskNone;
6938
if (sampler.isMultiSample()) {
6939
mask = mask | spv::ImageOperandsMask::Sample;
6940
}
6941
if (cracked.lod) {
6942
builder.addExtension(spv::E_SPV_AMD_shader_image_load_store_lod);
6943
builder.addCapability(spv::Capability::ImageReadWriteLodAMD);
6944
mask = mask | spv::ImageOperandsMask::Lod;
6945
}
6946
mask = mask | TranslateImageOperands(TranslateCoherent(imageType));
6947
mask = (spv::ImageOperandsMask)(mask & ~spv::ImageOperandsMask::MakeTexelAvailableKHR);
6948
mask = mask | signExtensionMask();
6949
if (mask != spv::ImageOperandsMask::MaskNone) {
6950
spv::IdImmediate imageOperands = { false, (unsigned int)mask };
6951
operands.push_back(imageOperands);
6952
}
6953
if (anySet(mask, spv::ImageOperandsMask::Sample)) {
6954
spv::IdImmediate imageOperand = { true, *opIt++ };
6955
operands.push_back(imageOperand);
6956
}
6957
if (anySet(mask, spv::ImageOperandsMask::Lod)) {
6958
spv::IdImmediate imageOperand = { true, *opIt++ };
6959
operands.push_back(imageOperand);
6960
}
6961
if (anySet(mask, spv::ImageOperandsMask::MakeTexelVisibleKHR)) {
6962
spv::IdImmediate imageOperand = { true,
6963
builder.makeUintConstant(TranslateMemoryScope(TranslateCoherent(imageType))) };
6964
operands.push_back(imageOperand);
6965
}
6966
6967
if (builder.getImageTypeFormat(builder.getImageType(operands.front().word)) == spv::ImageFormat::Unknown)
6968
builder.addCapability(spv::Capability::StorageImageReadWithoutFormat);
6969
6970
std::vector<spv::Id> result(1, builder.createOp(spv::Op::OpImageRead, resultType(), operands));
6971
builder.setPrecision(result[0], precision);
6972
6973
// If needed, add a conversion constructor to the proper size.
6974
if (components != node->getType().getVectorSize())
6975
result[0] = builder.createConstructor(precision, result, convertGlslangToSpvType(node->getType()));
6976
6977
return result[0];
6978
} else if (node->getOp() == glslang::EOpImageStore || node->getOp() == glslang::EOpImageStoreLod) {
6979
6980
// Push the texel value before the operands
6981
if (sampler.isMultiSample() || cracked.lod) {
6982
spv::IdImmediate texel = { true, *(opIt + 1) };
6983
operands.push_back(texel);
6984
} else {
6985
spv::IdImmediate texel = { true, *opIt };
6986
operands.push_back(texel);
6987
}
6988
6989
spv::ImageOperandsMask mask = spv::ImageOperandsMask::MaskNone;
6990
if (sampler.isMultiSample()) {
6991
mask = mask | spv::ImageOperandsMask::Sample;
6992
}
6993
if (cracked.lod) {
6994
builder.addExtension(spv::E_SPV_AMD_shader_image_load_store_lod);
6995
builder.addCapability(spv::Capability::ImageReadWriteLodAMD);
6996
mask = mask | spv::ImageOperandsMask::Lod;
6997
}
6998
mask = mask | TranslateImageOperands(TranslateCoherent(imageType));
6999
mask = (spv::ImageOperandsMask)(mask & ~spv::ImageOperandsMask::MakeTexelVisibleKHR);
7000
mask = mask | signExtensionMask();
7001
if (mask != spv::ImageOperandsMask::MaskNone) {
7002
spv::IdImmediate imageOperands = { false, (unsigned int)mask };
7003
operands.push_back(imageOperands);
7004
}
7005
if (anySet(mask, spv::ImageOperandsMask::Sample)) {
7006
spv::IdImmediate imageOperand = { true, *opIt++ };
7007
operands.push_back(imageOperand);
7008
}
7009
if (anySet(mask, spv::ImageOperandsMask::Lod)) {
7010
spv::IdImmediate imageOperand = { true, *opIt++ };
7011
operands.push_back(imageOperand);
7012
}
7013
if (anySet(mask, spv::ImageOperandsMask::MakeTexelAvailableKHR)) {
7014
spv::IdImmediate imageOperand = { true,
7015
builder.makeUintConstant(TranslateMemoryScope(TranslateCoherent(imageType))) };
7016
operands.push_back(imageOperand);
7017
}
7018
7019
builder.createNoResultOp(spv::Op::OpImageWrite, operands);
7020
if (builder.getImageTypeFormat(builder.getImageType(operands.front().word)) == spv::ImageFormat::Unknown)
7021
builder.addCapability(spv::Capability::StorageImageWriteWithoutFormat);
7022
return spv::NoResult;
7023
} else if (node->getOp() == glslang::EOpSparseImageLoad ||
7024
node->getOp() == glslang::EOpSparseImageLoadLod) {
7025
builder.addCapability(spv::Capability::SparseResidency);
7026
if (builder.getImageTypeFormat(builder.getImageType(operands.front().word)) == spv::ImageFormat::Unknown)
7027
builder.addCapability(spv::Capability::StorageImageReadWithoutFormat);
7028
7029
spv::ImageOperandsMask mask = spv::ImageOperandsMask::MaskNone;
7030
if (sampler.isMultiSample()) {
7031
mask = mask | spv::ImageOperandsMask::Sample;
7032
}
7033
if (cracked.lod) {
7034
builder.addExtension(spv::E_SPV_AMD_shader_image_load_store_lod);
7035
builder.addCapability(spv::Capability::ImageReadWriteLodAMD);
7036
7037
mask = mask | spv::ImageOperandsMask::Lod;
7038
}
7039
mask = mask | TranslateImageOperands(TranslateCoherent(imageType));
7040
mask = (spv::ImageOperandsMask)(mask & ~spv::ImageOperandsMask::MakeTexelAvailableKHR);
7041
mask = mask | signExtensionMask();
7042
if (mask != spv::ImageOperandsMask::MaskNone) {
7043
spv::IdImmediate imageOperands = { false, (unsigned int)mask };
7044
operands.push_back(imageOperands);
7045
}
7046
if (anySet(mask, spv::ImageOperandsMask::Sample)) {
7047
spv::IdImmediate imageOperand = { true, *opIt++ };
7048
operands.push_back(imageOperand);
7049
}
7050
if (anySet(mask, spv::ImageOperandsMask::Lod)) {
7051
spv::IdImmediate imageOperand = { true, *opIt++ };
7052
operands.push_back(imageOperand);
7053
}
7054
if (anySet(mask, spv::ImageOperandsMask::MakeTexelVisibleKHR)) {
7055
spv::IdImmediate imageOperand = { true, builder.makeUintConstant(TranslateMemoryScope(
7056
TranslateCoherent(imageType))) };
7057
operands.push_back(imageOperand);
7058
}
7059
7060
// Create the return type that was a special structure
7061
spv::Id texelOut = *opIt;
7062
spv::Id typeId0 = resultType();
7063
spv::Id typeId1 = builder.getDerefTypeId(texelOut);
7064
spv::Id resultTypeId = builder.makeStructResultType(typeId0, typeId1);
7065
7066
spv::Id resultId = builder.createOp(spv::Op::OpImageSparseRead, resultTypeId, operands);
7067
7068
// Decode the return type
7069
builder.createStore(builder.createCompositeExtract(resultId, typeId1, 1), texelOut);
7070
return builder.createCompositeExtract(resultId, typeId0, 0);
7071
} else {
7072
// Process image atomic operations
7073
7074
// GLSL "IMAGE_PARAMS" will involve in constructing an image texel pointer and this pointer,
7075
// as the first source operand, is required by SPIR-V atomic operations.
7076
// For non-MS, the sample value should be 0
7077
spv::IdImmediate sample = { true, sampler.isMultiSample() ? *(opIt++) : builder.makeUintConstant(0) };
7078
operands.push_back(sample);
7079
7080
spv::Id resultTypeId;
7081
glslang::TBasicType typeProxy = node->getBasicType();
7082
// imageAtomicStore has a void return type so base the pointer type on
7083
// the type of the value operand.
7084
if (node->getOp() == glslang::EOpImageAtomicStore) {
7085
resultTypeId = builder.makePointer(spv::StorageClass::Image, builder.getTypeId(*opIt));
7086
typeProxy = node->getAsAggregate()->getSequence()[0]->getAsTyped()->getType().getSampler().type;
7087
} else {
7088
resultTypeId = builder.makePointer(spv::StorageClass::Image, resultType());
7089
}
7090
spv::Id pointer = builder.createOp(spv::Op::OpImageTexelPointer, resultTypeId, operands);
7091
if (imageType.getQualifier().nonUniform) {
7092
builder.addDecoration(pointer, spv::Decoration::NonUniformEXT);
7093
}
7094
7095
std::vector<spv::Id> operands;
7096
operands.push_back(pointer);
7097
for (; opIt != arguments.end(); ++opIt)
7098
operands.push_back(*opIt);
7099
7100
return createAtomicOperation(node->getOp(), precision, resultType(), operands, typeProxy,
7101
lvalueCoherentFlags, node->getType());
7102
}
7103
}
7104
7105
// Check for fragment mask functions other than queries
7106
if (cracked.fragMask) {
7107
assert(sampler.ms);
7108
7109
auto opIt = arguments.begin();
7110
std::vector<spv::Id> operands;
7111
7112
operands.push_back(params.sampler);
7113
++opIt;
7114
7115
if (sampler.isSubpass()) {
7116
// add on the (0,0) coordinate
7117
spv::Id zero = builder.makeIntConstant(0);
7118
std::vector<spv::Id> comps;
7119
comps.push_back(zero);
7120
comps.push_back(zero);
7121
operands.push_back(builder.makeCompositeConstant(
7122
builder.makeVectorType(builder.makeIntType(32), 2), comps));
7123
}
7124
7125
for (; opIt != arguments.end(); ++opIt)
7126
operands.push_back(*opIt);
7127
7128
spv::Op fragMaskOp = spv::Op::OpNop;
7129
if (node->getOp() == glslang::EOpFragmentMaskFetch)
7130
fragMaskOp = spv::Op::OpFragmentMaskFetchAMD;
7131
else if (node->getOp() == glslang::EOpFragmentFetch)
7132
fragMaskOp = spv::Op::OpFragmentFetchAMD;
7133
7134
builder.addExtension(spv::E_SPV_AMD_shader_fragment_mask);
7135
builder.addCapability(spv::Capability::FragmentMaskAMD);
7136
return builder.createOp(fragMaskOp, resultType(), operands);
7137
}
7138
7139
// Check for texture functions other than queries
7140
bool sparse = node->isSparseTexture();
7141
bool imageFootprint = node->isImageFootprint();
7142
bool cubeCompare = sampler.dim == glslang::EsdCube && sampler.isArrayed() && sampler.isShadow();
7143
7144
// check for bias argument
7145
bool bias = false;
7146
if (! cracked.lod && ! cracked.grad && ! cracked.fetch && ! cubeCompare) {
7147
int nonBiasArgCount = 2;
7148
if (cracked.gather)
7149
++nonBiasArgCount; // comp argument should be present when bias argument is present
7150
7151
if (f16ShadowCompare)
7152
++nonBiasArgCount;
7153
if (cracked.offset)
7154
++nonBiasArgCount;
7155
else if (cracked.offsets)
7156
++nonBiasArgCount;
7157
if (cracked.grad)
7158
nonBiasArgCount += 2;
7159
if (cracked.lodClamp)
7160
++nonBiasArgCount;
7161
if (sparse)
7162
++nonBiasArgCount;
7163
if (imageFootprint)
7164
//Following three extra arguments
7165
// int granularity, bool coarse, out gl_TextureFootprint2DNV footprint
7166
nonBiasArgCount += 3;
7167
if ((int)arguments.size() > nonBiasArgCount)
7168
bias = true;
7169
}
7170
7171
if (cracked.gather) {
7172
const auto& sourceExtensions = glslangIntermediate->getRequestedExtensions();
7173
if (bias || cracked.lod ||
7174
sourceExtensions.find(glslang::E_GL_AMD_texture_gather_bias_lod) != sourceExtensions.end()) {
7175
builder.addExtension(spv::E_SPV_AMD_texture_gather_bias_lod);
7176
builder.addCapability(spv::Capability::ImageGatherBiasLodAMD);
7177
}
7178
}
7179
7180
// set the rest of the arguments
7181
7182
params.coords = arguments[1];
7183
int extraArgs = 0;
7184
bool noImplicitLod = false;
7185
7186
// sort out where Dref is coming from
7187
if (cubeCompare || f16ShadowCompare) {
7188
params.Dref = arguments[2];
7189
++extraArgs;
7190
} else if (sampler.shadow && cracked.gather) {
7191
params.Dref = arguments[2];
7192
++extraArgs;
7193
} else if (sampler.shadow) {
7194
std::vector<spv::Id> indexes;
7195
int dRefComp;
7196
if (cracked.proj)
7197
dRefComp = 2; // "The resulting 3rd component of P in the shadow forms is used as Dref"
7198
else
7199
dRefComp = builder.getNumComponents(params.coords) - 1;
7200
indexes.push_back(dRefComp);
7201
params.Dref = builder.createCompositeExtract(params.coords,
7202
builder.getScalarTypeId(builder.getTypeId(params.coords)), indexes);
7203
}
7204
7205
// lod
7206
if (cracked.lod) {
7207
params.lod = arguments[2 + extraArgs];
7208
++extraArgs;
7209
} else if (glslangIntermediate->getStage() != EShLangFragment &&
7210
!(glslangIntermediate->getStage() == EShLangCompute &&
7211
glslangIntermediate->hasLayoutDerivativeModeNone())) {
7212
// we need to invent the default lod for an explicit lod instruction for a non-fragment stage
7213
noImplicitLod = true;
7214
}
7215
7216
// multisample
7217
if (sampler.isMultiSample()) {
7218
params.sample = arguments[2 + extraArgs]; // For MS, "sample" should be specified
7219
++extraArgs;
7220
}
7221
7222
// gradient
7223
if (cracked.grad) {
7224
params.gradX = arguments[2 + extraArgs];
7225
params.gradY = arguments[3 + extraArgs];
7226
extraArgs += 2;
7227
}
7228
7229
// offset and offsets
7230
if (cracked.offset) {
7231
params.offset = arguments[2 + extraArgs];
7232
++extraArgs;
7233
} else if (cracked.offsets) {
7234
params.offsets = arguments[2 + extraArgs];
7235
++extraArgs;
7236
}
7237
7238
// lod clamp
7239
if (cracked.lodClamp) {
7240
params.lodClamp = arguments[2 + extraArgs];
7241
++extraArgs;
7242
}
7243
// sparse
7244
if (sparse) {
7245
params.texelOut = arguments[2 + extraArgs];
7246
++extraArgs;
7247
}
7248
// gather component
7249
if (cracked.gather && ! sampler.shadow) {
7250
// default component is 0, if missing, otherwise an argument
7251
if (2 + extraArgs < (int)arguments.size()) {
7252
params.component = arguments[2 + extraArgs];
7253
++extraArgs;
7254
} else
7255
params.component = builder.makeIntConstant(0);
7256
}
7257
spv::Id resultStruct = spv::NoResult;
7258
if (imageFootprint) {
7259
//Following three extra arguments
7260
// int granularity, bool coarse, out gl_TextureFootprint2DNV footprint
7261
params.granularity = arguments[2 + extraArgs];
7262
params.coarse = arguments[3 + extraArgs];
7263
resultStruct = arguments[4 + extraArgs];
7264
extraArgs += 3;
7265
}
7266
7267
// bias
7268
if (bias) {
7269
params.bias = arguments[2 + extraArgs];
7270
++extraArgs;
7271
}
7272
7273
if (imageFootprint) {
7274
builder.addExtension(spv::E_SPV_NV_shader_image_footprint);
7275
builder.addCapability(spv::Capability::ImageFootprintNV);
7276
7277
7278
//resultStructType(OpenGL type) contains 5 elements:
7279
//struct gl_TextureFootprint2DNV {
7280
// uvec2 anchor;
7281
// uvec2 offset;
7282
// uvec2 mask;
7283
// uint lod;
7284
// uint granularity;
7285
//};
7286
//or
7287
//struct gl_TextureFootprint3DNV {
7288
// uvec3 anchor;
7289
// uvec3 offset;
7290
// uvec2 mask;
7291
// uint lod;
7292
// uint granularity;
7293
//};
7294
spv::Id resultStructType = builder.getContainedTypeId(builder.getTypeId(resultStruct));
7295
assert(builder.isStructType(resultStructType));
7296
7297
//resType (SPIR-V type) contains 6 elements:
7298
//Member 0 must be a Boolean type scalar(LOD),
7299
//Member 1 must be a vector of integer type, whose Signedness operand is 0(anchor),
7300
//Member 2 must be a vector of integer type, whose Signedness operand is 0(offset),
7301
//Member 3 must be a vector of integer type, whose Signedness operand is 0(mask),
7302
//Member 4 must be a scalar of integer type, whose Signedness operand is 0(lod),
7303
//Member 5 must be a scalar of integer type, whose Signedness operand is 0(granularity).
7304
std::vector<spv::Id> members;
7305
members.push_back(resultType());
7306
for (int i = 0; i < 5; i++) {
7307
members.push_back(builder.getContainedTypeId(resultStructType, i));
7308
}
7309
spv::Id resType = builder.makeStructType(members, {}, "ResType");
7310
7311
//call ImageFootprintNV
7312
spv::Id res = builder.createTextureCall(precision, resType, sparse, cracked.fetch, cracked.proj,
7313
cracked.gather, noImplicitLod, params, signExtensionMask());
7314
7315
//copy resType (SPIR-V type) to resultStructType(OpenGL type)
7316
for (int i = 0; i < 5; i++) {
7317
builder.clearAccessChain();
7318
builder.setAccessChainLValue(resultStruct);
7319
7320
//Accessing to a struct we created, no coherent flag is set
7321
spv::Builder::AccessChain::CoherentFlags flags;
7322
flags.clear();
7323
7324
builder.accessChainPush(builder.makeIntConstant(i), flags, 0);
7325
builder.accessChainStore(builder.createCompositeExtract(res, builder.getContainedTypeId(resType, i+1),
7326
i+1), TranslateNonUniformDecoration(imageType.getQualifier()));
7327
}
7328
return builder.createCompositeExtract(res, resultType(), 0);
7329
}
7330
7331
// projective component (might not need to move)
7332
// GLSL: "The texture coordinates consumed from P, not including the last component of P,
7333
// are divided by the last component of P."
7334
// SPIR-V: "... (u [, v] [, w], q)... It may be a vector larger than needed, but all
7335
// unused components will appear after all used components."
7336
if (cracked.proj) {
7337
int projSourceComp = builder.getNumComponents(params.coords) - 1;
7338
int projTargetComp;
7339
switch (sampler.dim) {
7340
case glslang::Esd1D: projTargetComp = 1; break;
7341
case glslang::Esd2D: projTargetComp = 2; break;
7342
case glslang::EsdRect: projTargetComp = 2; break;
7343
default: projTargetComp = projSourceComp; break;
7344
}
7345
// copy the projective coordinate if we have to
7346
if (projTargetComp != projSourceComp) {
7347
spv::Id projComp = builder.createCompositeExtract(params.coords,
7348
builder.getScalarTypeId(builder.getTypeId(params.coords)), projSourceComp);
7349
params.coords = builder.createCompositeInsert(projComp, params.coords,
7350
builder.getTypeId(params.coords), projTargetComp);
7351
}
7352
}
7353
7354
// nonprivate
7355
if (imageType.getQualifier().nonprivate) {
7356
params.nonprivate = true;
7357
}
7358
7359
// volatile
7360
if (imageType.getQualifier().volatil) {
7361
params.volatil = true;
7362
}
7363
7364
if (imageType.getQualifier().nontemporal) {
7365
params.nontemporal = true;
7366
}
7367
7368
std::vector<spv::Id> result( 1,
7369
builder.createTextureCall(precision, resultType(), sparse, cracked.fetch, cracked.proj, cracked.gather,
7370
noImplicitLod, params, signExtensionMask())
7371
);
7372
7373
if (components != node->getType().getVectorSize())
7374
result[0] = builder.createConstructor(precision, result, convertGlslangToSpvType(node->getType()));
7375
7376
return result[0];
7377
}
7378
7379
// Emit a call to a user-defined function.
//
// The callee is looked up by name in functionMap; when no function is
// registered under that name, 0 is returned and nothing is emitted.
//
// Parameter passing follows the semantics described in makeFunctions() and is
// carried out in four phases:
//   1. evaluate every argument (as an l-value or as a loaded r-value)
//   2. build the actual argument list, allocating temporaries and copying
//      inputs where a copy is needed
//   3. emit the call
//   4. copy "out"/"inout" temporaries back to the caller's l-values
//
// Returns the id produced by the call instruction.
spv::Id TGlslangToSpvTraverser::handleUserFunctionCall(const glslang::TIntermAggregate* node)
{
    // Fetch the previously created function object for this callee.
    spv::Function* function = functionMap[node->getName().c_str()];
    if (function == nullptr)
        return 0;

    const glslang::TIntermSequence& callArgs = node->getSequence();
    const glslang::TQualifierList& argQualifiers = node->getQualifierList();

    std::vector<const glslang::TType*> argTypes;
    std::vector<spv::Builder::AccessChain> savedLValues;
    std::vector<spv::Id> loadedRValues;

    // True when argument 'a' is handed to the callee as the original object
    // (no copy). Only valid once argTypes[a] has been recorded.
    const auto passedAsOriginal = [&](int a) {
        return originalParam(argQualifiers[a], *argTypes[a], function->hasImplicitThis() && a == 0);
    };

    // Phase 1: evaluate the arguments and record their types.
    for (int a = 0; a < (int)callArgs.size(); ++a) {
        argTypes.push_back(&callArgs[a]->getAsTyped()->getType());

        // Traversing the argument leaves its access chain in the builder.
        builder.clearAccessChain();
        callArgs[a]->traverse(this);

        // Outputs and pass-by-original arguments stay l-values; everything
        // else is loaded right away.
        const bool keepAsLValue = passedAsOriginal(a) || writableParam(argQualifiers[a]);
        if (keepAsLValue)
            savedLValues.push_back(builder.getAccessChain());
        else
            loadedRValues.push_back(accessChainLoad(*argTypes.back()));
    }

    // Argument evaluation may have moved the debug location; point it back at the call.
    builder.setDebugSourceLocation(node->getLoc().line, node->getLoc().getFilename());

    // Phase 2: assemble the actual arguments. Anything that needs a copy gets
    // a function-local variable, initialized from the original for "in"/"inout".
    int lValueIdx = 0;
    int rValueIdx = 0;
    std::vector<spv::Id> spvArgs;
    for (int a = 0; a < (int)callArgs.size(); ++a) {
        spv::Id arg;

        if (passedAsOriginal(a)) {
            // Pass the caller's object itself.
            builder.setAccessChain(savedLValues[lValueIdx]);
            arg = builder.accessChainGetLValue();
            ++lValueIdx;
        } else if (writableParam(argQualifiers[a])) {
            // Writable parameter: the callee receives a fresh temporary.
            arg = builder.createVariable(function->getParamPrecision(a), spv::StorageClass::Function,
                                         builder.getContainedTypeId(function->getParamType(a)), "param");

            const bool carriesInput = argQualifiers[a] == glslang::EvqIn ||
                                      argQualifiers[a] == glslang::EvqInOut;
            if (carriesInput) {
                // Seed the temporary with the caller's current value.
                builder.setAccessChain(savedLValues[lValueIdx]);
                spv::Id initialValue = accessChainLoad(*argTypes[a]);
                builder.clearAccessChain();
                builder.setAccessChainLValue(arg);
                multiTypeStore(*argTypes[a], initialValue);
            }
            ++lValueIdx;
        } else {
            // Plain r-value; go through a temporary only when the type or the
            // precision differs from what the parameter expects.
            spv::Id rValue = loadedRValues[rValueIdx];
            const bool needsConversionCopy =
                function->getParamType(a) != builder.getTypeId(rValue) ||
                TranslatePrecisionDecoration(*argTypes[a]) != function->getParamPrecision(a);

            if (needsConversionCopy) {
                spv::Id argCopy = builder.createVariable(function->getParamPrecision(a),
                                                         spv::StorageClass::Function,
                                                         function->getParamType(a), "arg");
                builder.clearAccessChain();
                builder.setAccessChainLValue(argCopy);
                multiTypeStore(*argTypes[a], rValue);
                arg = builder.createLoad(argCopy, function->getParamPrecision(a));
            } else {
                arg = rValue;
            }
            ++rValueIdx;
        }

        spvArgs.push_back(arg);
    }

    // Phase 3: emit the call and decorate its result.
    spv::Id result = builder.createFunctionCall(function, spvArgs);
    builder.setPrecision(result, TranslatePrecisionDecoration(node->getType()));
    builder.addDecoration(result, TranslateNonUniformDecoration(node->getType().getQualifier()));

    // Phase 4: copy "out" and "inout" temporaries back to the caller's l-values.
    // lValueIdx walks savedLValues in the same order used in phase 2.
    lValueIdx = 0;
    for (int a = 0; a < (int)callArgs.size(); ++a) {
        if (passedAsOriginal(a)) {
            // Passed in place: nothing to copy, but it did consume an l-value slot.
            ++lValueIdx;
            continue;
        }
        if (! writableParam(argQualifiers[a]))
            continue;

        if (argQualifiers[a] == glslang::EvqOut || argQualifiers[a] == glslang::EvqInOut) {
            spv::Id copy = builder.createLoad(spvArgs[a], spv::NoPrecision);
            builder.addDecoration(copy, TranslateNonUniformDecoration(argTypes[a]->getQualifier()));
            builder.setAccessChain(savedLValues[lValueIdx]);
            multiTypeStore(*argTypes[a], copy);
        }
        ++lValueIdx;
    }

    return result;
}
7486
7487
// Translate AST operation to SPV operation, already having SPV-based operands/types.
7488
spv::Id TGlslangToSpvTraverser::createBinaryOperation(glslang::TOperator op, OpDecorations& decorations,
7489
spv::Id typeId, spv::Id left, spv::Id right,
7490
glslang::TBasicType typeProxy, bool reduceComparison)
7491
{
7492
bool isUnsigned = isTypeUnsignedInt(typeProxy);
7493
bool isFloat = isTypeFloat(typeProxy);
7494
bool isBool = typeProxy == glslang::EbtBool;
7495
7496
spv::Op binOp = spv::Op::OpNop;
7497
bool needMatchingVectors = true; // for non-matrix ops, would a scalar need to smear to match a vector?
7498
bool comparison = false;
7499
7500
switch (op) {
7501
case glslang::EOpAdd:
7502
case glslang::EOpAddAssign:
7503
if (isFloat)
7504
binOp = spv::Op::OpFAdd;
7505
else
7506
binOp = spv::Op::OpIAdd;
7507
break;
7508
case glslang::EOpSub:
7509
case glslang::EOpSubAssign:
7510
if (isFloat)
7511
binOp = spv::Op::OpFSub;
7512
else
7513
binOp = spv::Op::OpISub;
7514
break;
7515
case glslang::EOpMul:
7516
case glslang::EOpMulAssign:
7517
if (isFloat)
7518
binOp = spv::Op::OpFMul;
7519
else
7520
binOp = spv::Op::OpIMul;
7521
break;
7522
case glslang::EOpVectorTimesScalar:
7523
case glslang::EOpVectorTimesScalarAssign:
7524
if (isFloat && (builder.isVector(left) || builder.isVector(right) || builder.isCooperativeVector(left) || builder.isCooperativeVector(right))) {
7525
if (builder.isVector(right) || builder.isCooperativeVector(right))
7526
std::swap(left, right);
7527
assert(builder.isScalar(right));
7528
needMatchingVectors = false;
7529
binOp = spv::Op::OpVectorTimesScalar;
7530
} else if (isFloat) {
7531
binOp = spv::Op::OpFMul;
7532
} else if (builder.isCooperativeVector(left) || builder.isCooperativeVector(right)) {
7533
if (builder.isCooperativeVector(right))
7534
std::swap(left, right);
7535
assert(builder.isScalar(right));
7536
// Construct a cooperative vector from the scalar
7537
right = builder.createCompositeConstruct(builder.getTypeId(left), { right });
7538
binOp = spv::Op::OpIMul;
7539
} else {
7540
binOp = spv::Op::OpIMul;
7541
}
7542
break;
7543
case glslang::EOpVectorTimesMatrix:
7544
case glslang::EOpVectorTimesMatrixAssign:
7545
binOp = spv::Op::OpVectorTimesMatrix;
7546
break;
7547
case glslang::EOpMatrixTimesVector:
7548
binOp = spv::Op::OpMatrixTimesVector;
7549
break;
7550
case glslang::EOpMatrixTimesScalar:
7551
case glslang::EOpMatrixTimesScalarAssign:
7552
binOp = spv::Op::OpMatrixTimesScalar;
7553
break;
7554
case glslang::EOpMatrixTimesMatrix:
7555
case glslang::EOpMatrixTimesMatrixAssign:
7556
binOp = spv::Op::OpMatrixTimesMatrix;
7557
break;
7558
case glslang::EOpOuterProduct:
7559
binOp = spv::Op::OpOuterProduct;
7560
needMatchingVectors = false;
7561
break;
7562
7563
case glslang::EOpDiv:
7564
case glslang::EOpDivAssign:
7565
if (isFloat)
7566
binOp = spv::Op::OpFDiv;
7567
else if (isUnsigned)
7568
binOp = spv::Op::OpUDiv;
7569
else
7570
binOp = spv::Op::OpSDiv;
7571
break;
7572
case glslang::EOpMod:
7573
case glslang::EOpModAssign:
7574
if (isFloat)
7575
binOp = spv::Op::OpFMod;
7576
else if (isUnsigned)
7577
binOp = spv::Op::OpUMod;
7578
else
7579
binOp = spv::Op::OpSMod;
7580
break;
7581
case glslang::EOpRightShift:
7582
case glslang::EOpRightShiftAssign:
7583
if (isUnsigned)
7584
binOp = spv::Op::OpShiftRightLogical;
7585
else
7586
binOp = spv::Op::OpShiftRightArithmetic;
7587
break;
7588
case glslang::EOpLeftShift:
7589
case glslang::EOpLeftShiftAssign:
7590
binOp = spv::Op::OpShiftLeftLogical;
7591
break;
7592
case glslang::EOpAnd:
7593
case glslang::EOpAndAssign:
7594
binOp = spv::Op::OpBitwiseAnd;
7595
break;
7596
case glslang::EOpLogicalAnd:
7597
needMatchingVectors = false;
7598
binOp = spv::Op::OpLogicalAnd;
7599
break;
7600
case glslang::EOpInclusiveOr:
7601
case glslang::EOpInclusiveOrAssign:
7602
binOp = spv::Op::OpBitwiseOr;
7603
break;
7604
case glslang::EOpLogicalOr:
7605
needMatchingVectors = false;
7606
binOp = spv::Op::OpLogicalOr;
7607
break;
7608
case glslang::EOpExclusiveOr:
7609
case glslang::EOpExclusiveOrAssign:
7610
binOp = spv::Op::OpBitwiseXor;
7611
break;
7612
case glslang::EOpLogicalXor:
7613
needMatchingVectors = false;
7614
binOp = spv::Op::OpLogicalNotEqual;
7615
break;
7616
7617
case glslang::EOpAbsDifference:
7618
binOp = isUnsigned ? spv::Op::OpAbsUSubINTEL : spv::Op::OpAbsISubINTEL;
7619
break;
7620
7621
case glslang::EOpAddSaturate:
7622
binOp = isUnsigned ? spv::Op::OpUAddSatINTEL : spv::Op::OpIAddSatINTEL;
7623
break;
7624
7625
case glslang::EOpSubSaturate:
7626
binOp = isUnsigned ? spv::Op::OpUSubSatINTEL : spv::Op::OpISubSatINTEL;
7627
break;
7628
7629
case glslang::EOpAverage:
7630
binOp = isUnsigned ? spv::Op::OpUAverageINTEL : spv::Op::OpIAverageINTEL;
7631
break;
7632
7633
case glslang::EOpAverageRounded:
7634
binOp = isUnsigned ? spv::Op::OpUAverageRoundedINTEL : spv::Op::OpIAverageRoundedINTEL;
7635
break;
7636
7637
case glslang::EOpMul32x16:
7638
binOp = isUnsigned ? spv::Op::OpUMul32x16INTEL : spv::Op::OpIMul32x16INTEL;
7639
break;
7640
7641
case glslang::EOpExpectEXT:
7642
binOp = spv::Op::OpExpectKHR;
7643
break;
7644
7645
case glslang::EOpLessThan:
7646
case glslang::EOpGreaterThan:
7647
case glslang::EOpLessThanEqual:
7648
case glslang::EOpGreaterThanEqual:
7649
case glslang::EOpEqual:
7650
case glslang::EOpNotEqual:
7651
case glslang::EOpVectorEqual:
7652
case glslang::EOpVectorNotEqual:
7653
comparison = true;
7654
break;
7655
default:
7656
break;
7657
}
7658
7659
// handle mapped binary operations (should be non-comparison)
7660
if (binOp != spv::Op::OpNop) {
7661
assert(comparison == false);
7662
if (builder.isMatrix(left) || builder.isMatrix(right) ||
7663
builder.isCooperativeMatrix(left) || builder.isCooperativeMatrix(right))
7664
return createBinaryMatrixOperation(binOp, decorations, typeId, left, right);
7665
7666
// No matrix involved; make both operands be the same number of components, if needed
7667
if (needMatchingVectors)
7668
builder.promoteScalar(decorations.precision, left, right);
7669
7670
spv::Id result = builder.createBinOp(binOp, typeId, left, right);
7671
decorations.addNoContraction(builder, result);
7672
decorations.addNonUniform(builder, result);
7673
return builder.setPrecision(result, decorations.precision);
7674
}
7675
7676
if (! comparison)
7677
return 0;
7678
7679
// Handle comparison instructions
7680
7681
if (reduceComparison && (op == glslang::EOpEqual || op == glslang::EOpNotEqual)
7682
&& (builder.isVector(left) || builder.isMatrix(left) || builder.isAggregate(left))) {
7683
spv::Id result = builder.createCompositeCompare(decorations.precision, left, right, op == glslang::EOpEqual);
7684
decorations.addNonUniform(builder, result);
7685
return result;
7686
}
7687
7688
switch (op) {
7689
case glslang::EOpLessThan:
7690
if (isFloat)
7691
binOp = spv::Op::OpFOrdLessThan;
7692
else if (isUnsigned)
7693
binOp = spv::Op::OpULessThan;
7694
else
7695
binOp = spv::Op::OpSLessThan;
7696
break;
7697
case glslang::EOpGreaterThan:
7698
if (isFloat)
7699
binOp = spv::Op::OpFOrdGreaterThan;
7700
else if (isUnsigned)
7701
binOp = spv::Op::OpUGreaterThan;
7702
else
7703
binOp = spv::Op::OpSGreaterThan;
7704
break;
7705
case glslang::EOpLessThanEqual:
7706
if (isFloat)
7707
binOp = spv::Op::OpFOrdLessThanEqual;
7708
else if (isUnsigned)
7709
binOp = spv::Op::OpULessThanEqual;
7710
else
7711
binOp = spv::Op::OpSLessThanEqual;
7712
break;
7713
case glslang::EOpGreaterThanEqual:
7714
if (isFloat)
7715
binOp = spv::Op::OpFOrdGreaterThanEqual;
7716
else if (isUnsigned)
7717
binOp = spv::Op::OpUGreaterThanEqual;
7718
else
7719
binOp = spv::Op::OpSGreaterThanEqual;
7720
break;
7721
case glslang::EOpEqual:
7722
case glslang::EOpVectorEqual:
7723
if (isFloat)
7724
binOp = spv::Op::OpFOrdEqual;
7725
else if (isBool)
7726
binOp = spv::Op::OpLogicalEqual;
7727
else
7728
binOp = spv::Op::OpIEqual;
7729
break;
7730
case glslang::EOpNotEqual:
7731
case glslang::EOpVectorNotEqual:
7732
if (isFloat)
7733
binOp = spv::Op::OpFUnordNotEqual;
7734
else if (isBool)
7735
binOp = spv::Op::OpLogicalNotEqual;
7736
else
7737
binOp = spv::Op::OpINotEqual;
7738
break;
7739
default:
7740
break;
7741
}
7742
7743
if (binOp != spv::Op::OpNop) {
7744
spv::Id result = builder.createBinOp(binOp, typeId, left, right);
7745
decorations.addNoContraction(builder, result);
7746
decorations.addNonUniform(builder, result);
7747
return builder.setPrecision(result, decorations.precision);
7748
}
7749
7750
return 0;
7751
}
7752
7753
//
7754
// Translate AST matrix operation to SPV operation, already having SPV-based operands/types.
7755
// These can be any of:
7756
//
7757
// matrix * scalar
7758
// scalar * matrix
7759
// matrix * matrix linear algebraic
7760
// matrix * vector
7761
// vector * matrix
7762
// matrix * matrix componentwise
7763
// matrix op matrix op in {+, -, /}
7764
// matrix op scalar op in {+, -, /}
7765
// scalar op matrix op in {+, -, /}
7766
//
7767
spv::Id TGlslangToSpvTraverser::createBinaryMatrixOperation(spv::Op op, OpDecorations& decorations, spv::Id typeId,
7768
spv::Id left, spv::Id right)
7769
{
7770
bool firstClass = true;
7771
7772
// First, handle first-class matrix operations (* and matrix/scalar)
7773
switch (op) {
7774
case spv::Op::OpFDiv:
7775
if (builder.isMatrix(left) && builder.isScalar(right)) {
7776
// turn matrix / scalar into a multiply...
7777
spv::Id resultType = builder.getTypeId(right);
7778
right = builder.createBinOp(spv::Op::OpFDiv, resultType, builder.makeFpConstant(resultType, 1.0), right);
7779
op = spv::Op::OpMatrixTimesScalar;
7780
} else
7781
firstClass = false;
7782
break;
7783
case spv::Op::OpMatrixTimesScalar:
7784
if (builder.isMatrix(right) || builder.isCooperativeMatrix(right))
7785
std::swap(left, right);
7786
assert(builder.isScalar(right));
7787
break;
7788
case spv::Op::OpVectorTimesMatrix:
7789
assert(builder.isVector(left));
7790
assert(builder.isMatrix(right));
7791
break;
7792
case spv::Op::OpMatrixTimesVector:
7793
assert(builder.isMatrix(left));
7794
assert(builder.isVector(right));
7795
break;
7796
case spv::Op::OpMatrixTimesMatrix:
7797
assert(builder.isMatrix(left));
7798
assert(builder.isMatrix(right));
7799
break;
7800
default:
7801
firstClass = false;
7802
break;
7803
}
7804
7805
if (builder.isCooperativeMatrix(left) || builder.isCooperativeMatrix(right))
7806
firstClass = true;
7807
7808
if (firstClass) {
7809
spv::Id result = builder.createBinOp(op, typeId, left, right);
7810
decorations.addNoContraction(builder, result);
7811
decorations.addNonUniform(builder, result);
7812
return builder.setPrecision(result, decorations.precision);
7813
}
7814
7815
// Handle component-wise +, -, *, %, and / for all combinations of type.
7816
// The result type of all of them is the same type as the (a) matrix operand.
7817
// The algorithm is to:
7818
// - break the matrix(es) into vectors
7819
// - smear any scalar to a vector
7820
// - do vector operations
7821
// - make a matrix out the vector results
7822
switch (op) {
7823
case spv::Op::OpFAdd:
7824
case spv::Op::OpFSub:
7825
case spv::Op::OpFDiv:
7826
case spv::Op::OpFMod:
7827
case spv::Op::OpFMul:
7828
{
7829
// one time set up...
7830
bool leftMat = builder.isMatrix(left);
7831
bool rightMat = builder.isMatrix(right);
7832
unsigned int numCols = leftMat ? builder.getNumColumns(left) : builder.getNumColumns(right);
7833
int numRows = leftMat ? builder.getNumRows(left) : builder.getNumRows(right);
7834
spv::Id scalarType = builder.getScalarTypeId(typeId);
7835
spv::Id vecType = builder.makeVectorType(scalarType, numRows);
7836
std::vector<spv::Id> results;
7837
spv::Id smearVec = spv::NoResult;
7838
if (builder.isScalar(left))
7839
smearVec = builder.smearScalar(decorations.precision, left, vecType);
7840
else if (builder.isScalar(right))
7841
smearVec = builder.smearScalar(decorations.precision, right, vecType);
7842
7843
// do each vector op
7844
for (unsigned int c = 0; c < numCols; ++c) {
7845
std::vector<unsigned int> indexes;
7846
indexes.push_back(c);
7847
spv::Id leftVec = leftMat ? builder.createCompositeExtract( left, vecType, indexes) : smearVec;
7848
spv::Id rightVec = rightMat ? builder.createCompositeExtract(right, vecType, indexes) : smearVec;
7849
spv::Id result = builder.createBinOp(op, vecType, leftVec, rightVec);
7850
decorations.addNoContraction(builder, result);
7851
decorations.addNonUniform(builder, result);
7852
results.push_back(builder.setPrecision(result, decorations.precision));
7853
}
7854
7855
// put the pieces together
7856
spv::Id result = builder.setPrecision(builder.createCompositeConstruct(typeId, results), decorations.precision);
7857
decorations.addNonUniform(builder, result);
7858
return result;
7859
}
7860
default:
7861
assert(0);
7862
return spv::NoResult;
7863
}
7864
}
7865
7866
spv::Id TGlslangToSpvTraverser::createUnaryOperation(glslang::TOperator op, OpDecorations& decorations, spv::Id typeId,
7867
spv::Id operand, glslang::TBasicType typeProxy, const spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags,
7868
const glslang::TType &opType)
7869
{
7870
spv::Op unaryOp = spv::Op::OpNop;
7871
int extBuiltins = -1;
7872
int libCall = -1;
7873
bool isUnsigned = isTypeUnsignedInt(typeProxy);
7874
bool isFloat = isTypeFloat(typeProxy);
7875
7876
switch (op) {
7877
case glslang::EOpNegative:
7878
if (isFloat) {
7879
unaryOp = spv::Op::OpFNegate;
7880
if (builder.isMatrixType(typeId))
7881
return createUnaryMatrixOperation(unaryOp, decorations, typeId, operand, typeProxy);
7882
} else
7883
unaryOp = spv::Op::OpSNegate;
7884
break;
7885
7886
case glslang::EOpLogicalNot:
7887
case glslang::EOpVectorLogicalNot:
7888
unaryOp = spv::Op::OpLogicalNot;
7889
break;
7890
case glslang::EOpBitwiseNot:
7891
unaryOp = spv::Op::OpNot;
7892
break;
7893
7894
case glslang::EOpDeterminant:
7895
libCall = spv::GLSLstd450Determinant;
7896
break;
7897
case glslang::EOpMatrixInverse:
7898
libCall = spv::GLSLstd450MatrixInverse;
7899
break;
7900
case glslang::EOpTranspose:
7901
unaryOp = spv::Op::OpTranspose;
7902
break;
7903
7904
case glslang::EOpRadians:
7905
libCall = spv::GLSLstd450Radians;
7906
break;
7907
case glslang::EOpDegrees:
7908
libCall = spv::GLSLstd450Degrees;
7909
break;
7910
case glslang::EOpSin:
7911
libCall = spv::GLSLstd450Sin;
7912
break;
7913
case glslang::EOpCos:
7914
libCall = spv::GLSLstd450Cos;
7915
break;
7916
case glslang::EOpTan:
7917
libCall = spv::GLSLstd450Tan;
7918
break;
7919
case glslang::EOpAcos:
7920
libCall = spv::GLSLstd450Acos;
7921
break;
7922
case glslang::EOpAsin:
7923
libCall = spv::GLSLstd450Asin;
7924
break;
7925
case glslang::EOpAtan:
7926
libCall = spv::GLSLstd450Atan;
7927
break;
7928
7929
case glslang::EOpAcosh:
7930
libCall = spv::GLSLstd450Acosh;
7931
break;
7932
case glslang::EOpAsinh:
7933
libCall = spv::GLSLstd450Asinh;
7934
break;
7935
case glslang::EOpAtanh:
7936
libCall = spv::GLSLstd450Atanh;
7937
break;
7938
case glslang::EOpTanh:
7939
libCall = spv::GLSLstd450Tanh;
7940
break;
7941
case glslang::EOpCosh:
7942
libCall = spv::GLSLstd450Cosh;
7943
break;
7944
case glslang::EOpSinh:
7945
libCall = spv::GLSLstd450Sinh;
7946
break;
7947
7948
case glslang::EOpLength:
7949
libCall = spv::GLSLstd450Length;
7950
break;
7951
case glslang::EOpNormalize:
7952
libCall = spv::GLSLstd450Normalize;
7953
break;
7954
7955
case glslang::EOpExp:
7956
libCall = spv::GLSLstd450Exp;
7957
break;
7958
case glslang::EOpLog:
7959
libCall = spv::GLSLstd450Log;
7960
break;
7961
case glslang::EOpExp2:
7962
libCall = spv::GLSLstd450Exp2;
7963
break;
7964
case glslang::EOpLog2:
7965
libCall = spv::GLSLstd450Log2;
7966
break;
7967
case glslang::EOpSqrt:
7968
libCall = spv::GLSLstd450Sqrt;
7969
break;
7970
case glslang::EOpInverseSqrt:
7971
libCall = spv::GLSLstd450InverseSqrt;
7972
break;
7973
7974
case glslang::EOpFloor:
7975
libCall = spv::GLSLstd450Floor;
7976
break;
7977
case glslang::EOpTrunc:
7978
libCall = spv::GLSLstd450Trunc;
7979
break;
7980
case glslang::EOpRound:
7981
libCall = spv::GLSLstd450Round;
7982
break;
7983
case glslang::EOpRoundEven:
7984
libCall = spv::GLSLstd450RoundEven;
7985
break;
7986
case glslang::EOpCeil:
7987
libCall = spv::GLSLstd450Ceil;
7988
break;
7989
case glslang::EOpFract:
7990
libCall = spv::GLSLstd450Fract;
7991
break;
7992
7993
case glslang::EOpIsNan:
7994
unaryOp = spv::Op::OpIsNan;
7995
break;
7996
case glslang::EOpIsInf:
7997
unaryOp = spv::Op::OpIsInf;
7998
break;
7999
case glslang::EOpIsFinite:
8000
unaryOp = spv::Op::OpIsFinite;
8001
break;
8002
8003
case glslang::EOpFloatBitsToInt:
8004
case glslang::EOpFloatBitsToUint:
8005
case glslang::EOpIntBitsToFloat:
8006
case glslang::EOpUintBitsToFloat:
8007
case glslang::EOpDoubleBitsToInt64:
8008
case glslang::EOpDoubleBitsToUint64:
8009
case glslang::EOpInt64BitsToDouble:
8010
case glslang::EOpUint64BitsToDouble:
8011
case glslang::EOpFloat16BitsToInt16:
8012
case glslang::EOpFloat16BitsToUint16:
8013
case glslang::EOpInt16BitsToFloat16:
8014
case glslang::EOpUint16BitsToFloat16:
8015
unaryOp = spv::Op::OpBitcast;
8016
break;
8017
8018
case glslang::EOpPackSnorm2x16:
8019
libCall = spv::GLSLstd450PackSnorm2x16;
8020
break;
8021
case glslang::EOpUnpackSnorm2x16:
8022
libCall = spv::GLSLstd450UnpackSnorm2x16;
8023
break;
8024
case glslang::EOpPackUnorm2x16:
8025
libCall = spv::GLSLstd450PackUnorm2x16;
8026
break;
8027
case glslang::EOpUnpackUnorm2x16:
8028
libCall = spv::GLSLstd450UnpackUnorm2x16;
8029
break;
8030
case glslang::EOpPackHalf2x16:
8031
libCall = spv::GLSLstd450PackHalf2x16;
8032
break;
8033
case glslang::EOpUnpackHalf2x16:
8034
libCall = spv::GLSLstd450UnpackHalf2x16;
8035
break;
8036
case glslang::EOpPackSnorm4x8:
8037
libCall = spv::GLSLstd450PackSnorm4x8;
8038
break;
8039
case glslang::EOpUnpackSnorm4x8:
8040
libCall = spv::GLSLstd450UnpackSnorm4x8;
8041
break;
8042
case glslang::EOpPackUnorm4x8:
8043
libCall = spv::GLSLstd450PackUnorm4x8;
8044
break;
8045
case glslang::EOpUnpackUnorm4x8:
8046
libCall = spv::GLSLstd450UnpackUnorm4x8;
8047
break;
8048
case glslang::EOpPackDouble2x32:
8049
libCall = spv::GLSLstd450PackDouble2x32;
8050
break;
8051
case glslang::EOpUnpackDouble2x32:
8052
libCall = spv::GLSLstd450UnpackDouble2x32;
8053
break;
8054
8055
case glslang::EOpPackInt2x32:
8056
case glslang::EOpUnpackInt2x32:
8057
case glslang::EOpPackUint2x32:
8058
case glslang::EOpUnpackUint2x32:
8059
case glslang::EOpPack16:
8060
case glslang::EOpPack32:
8061
case glslang::EOpPack64:
8062
case glslang::EOpUnpack32:
8063
case glslang::EOpUnpack16:
8064
case glslang::EOpUnpack8:
8065
case glslang::EOpPackInt2x16:
8066
case glslang::EOpUnpackInt2x16:
8067
case glslang::EOpPackUint2x16:
8068
case glslang::EOpUnpackUint2x16:
8069
case glslang::EOpPackInt4x16:
8070
case glslang::EOpUnpackInt4x16:
8071
case glslang::EOpPackUint4x16:
8072
case glslang::EOpUnpackUint4x16:
8073
case glslang::EOpPackFloat2x16:
8074
case glslang::EOpUnpackFloat2x16:
8075
unaryOp = spv::Op::OpBitcast;
8076
break;
8077
8078
case glslang::EOpDPdx:
8079
unaryOp = spv::Op::OpDPdx;
8080
break;
8081
case glslang::EOpDPdy:
8082
unaryOp = spv::Op::OpDPdy;
8083
break;
8084
case glslang::EOpFwidth:
8085
unaryOp = spv::Op::OpFwidth;
8086
break;
8087
8088
case glslang::EOpAny:
8089
unaryOp = spv::Op::OpAny;
8090
break;
8091
case glslang::EOpAll:
8092
unaryOp = spv::Op::OpAll;
8093
break;
8094
8095
case glslang::EOpAbs:
8096
if (isFloat)
8097
libCall = spv::GLSLstd450FAbs;
8098
else
8099
libCall = spv::GLSLstd450SAbs;
8100
break;
8101
case glslang::EOpSign:
8102
if (isFloat)
8103
libCall = spv::GLSLstd450FSign;
8104
else
8105
libCall = spv::GLSLstd450SSign;
8106
break;
8107
8108
case glslang::EOpDPdxFine:
8109
unaryOp = spv::Op::OpDPdxFine;
8110
break;
8111
case glslang::EOpDPdyFine:
8112
unaryOp = spv::Op::OpDPdyFine;
8113
break;
8114
case glslang::EOpFwidthFine:
8115
unaryOp = spv::Op::OpFwidthFine;
8116
break;
8117
case glslang::EOpDPdxCoarse:
8118
unaryOp = spv::Op::OpDPdxCoarse;
8119
break;
8120
case glslang::EOpDPdyCoarse:
8121
unaryOp = spv::Op::OpDPdyCoarse;
8122
break;
8123
case glslang::EOpFwidthCoarse:
8124
unaryOp = spv::Op::OpFwidthCoarse;
8125
break;
8126
case glslang::EOpRayQueryProceed:
8127
unaryOp = spv::Op::OpRayQueryProceedKHR;
8128
break;
8129
case glslang::EOpRayQueryGetRayTMin:
8130
unaryOp = spv::Op::OpRayQueryGetRayTMinKHR;
8131
break;
8132
case glslang::EOpRayQueryGetRayFlags:
8133
unaryOp = spv::Op::OpRayQueryGetRayFlagsKHR;
8134
break;
8135
case glslang::EOpRayQueryGetWorldRayOrigin:
8136
unaryOp = spv::Op::OpRayQueryGetWorldRayOriginKHR;
8137
break;
8138
case glslang::EOpRayQueryGetWorldRayDirection:
8139
unaryOp = spv::Op::OpRayQueryGetWorldRayDirectionKHR;
8140
break;
8141
case glslang::EOpRayQueryGetIntersectionCandidateAABBOpaque:
8142
unaryOp = spv::Op::OpRayQueryGetIntersectionCandidateAABBOpaqueKHR;
8143
break;
8144
case glslang::EOpInterpolateAtCentroid:
8145
if (typeProxy == glslang::EbtFloat16)
8146
builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float);
8147
libCall = spv::GLSLstd450InterpolateAtCentroid;
8148
break;
8149
case glslang::EOpAtomicCounterIncrement:
8150
case glslang::EOpAtomicCounterDecrement:
8151
case glslang::EOpAtomicCounter:
8152
{
8153
// Handle all of the atomics in one place, in createAtomicOperation()
8154
std::vector<spv::Id> operands;
8155
operands.push_back(operand);
8156
return createAtomicOperation(op, decorations.precision, typeId, operands, typeProxy, lvalueCoherentFlags, opType);
8157
}
8158
8159
case glslang::EOpBitFieldReverse:
8160
unaryOp = spv::Op::OpBitReverse;
8161
break;
8162
case glslang::EOpBitCount:
8163
unaryOp = spv::Op::OpBitCount;
8164
break;
8165
case glslang::EOpFindLSB:
8166
libCall = spv::GLSLstd450FindILsb;
8167
break;
8168
case glslang::EOpFindMSB:
8169
if (isUnsigned)
8170
libCall = spv::GLSLstd450FindUMsb;
8171
else
8172
libCall = spv::GLSLstd450FindSMsb;
8173
break;
8174
8175
case glslang::EOpCountLeadingZeros:
8176
builder.addCapability(spv::Capability::IntegerFunctions2INTEL);
8177
builder.addExtension("SPV_INTEL_shader_integer_functions2");
8178
unaryOp = spv::Op::OpUCountLeadingZerosINTEL;
8179
break;
8180
8181
case glslang::EOpCountTrailingZeros:
8182
builder.addCapability(spv::Capability::IntegerFunctions2INTEL);
8183
builder.addExtension("SPV_INTEL_shader_integer_functions2");
8184
unaryOp = spv::Op::OpUCountTrailingZerosINTEL;
8185
break;
8186
8187
case glslang::EOpBallot:
8188
case glslang::EOpReadFirstInvocation:
8189
case glslang::EOpAnyInvocation:
8190
case glslang::EOpAllInvocations:
8191
case glslang::EOpAllInvocationsEqual:
8192
case glslang::EOpMinInvocations:
8193
case glslang::EOpMaxInvocations:
8194
case glslang::EOpAddInvocations:
8195
case glslang::EOpMinInvocationsNonUniform:
8196
case glslang::EOpMaxInvocationsNonUniform:
8197
case glslang::EOpAddInvocationsNonUniform:
8198
case glslang::EOpMinInvocationsInclusiveScan:
8199
case glslang::EOpMaxInvocationsInclusiveScan:
8200
case glslang::EOpAddInvocationsInclusiveScan:
8201
case glslang::EOpMinInvocationsInclusiveScanNonUniform:
8202
case glslang::EOpMaxInvocationsInclusiveScanNonUniform:
8203
case glslang::EOpAddInvocationsInclusiveScanNonUniform:
8204
case glslang::EOpMinInvocationsExclusiveScan:
8205
case glslang::EOpMaxInvocationsExclusiveScan:
8206
case glslang::EOpAddInvocationsExclusiveScan:
8207
case glslang::EOpMinInvocationsExclusiveScanNonUniform:
8208
case glslang::EOpMaxInvocationsExclusiveScanNonUniform:
8209
case glslang::EOpAddInvocationsExclusiveScanNonUniform:
8210
{
8211
std::vector<spv::Id> operands;
8212
operands.push_back(operand);
8213
return createInvocationsOperation(op, typeId, operands, typeProxy);
8214
}
8215
case glslang::EOpSubgroupAll:
8216
case glslang::EOpSubgroupAny:
8217
case glslang::EOpSubgroupAllEqual:
8218
case glslang::EOpSubgroupBroadcastFirst:
8219
case glslang::EOpSubgroupBallot:
8220
case glslang::EOpSubgroupInverseBallot:
8221
case glslang::EOpSubgroupBallotBitCount:
8222
case glslang::EOpSubgroupBallotInclusiveBitCount:
8223
case glslang::EOpSubgroupBallotExclusiveBitCount:
8224
case glslang::EOpSubgroupBallotFindLSB:
8225
case glslang::EOpSubgroupBallotFindMSB:
8226
case glslang::EOpSubgroupAdd:
8227
case glslang::EOpSubgroupMul:
8228
case glslang::EOpSubgroupMin:
8229
case glslang::EOpSubgroupMax:
8230
case glslang::EOpSubgroupAnd:
8231
case glslang::EOpSubgroupOr:
8232
case glslang::EOpSubgroupXor:
8233
case glslang::EOpSubgroupInclusiveAdd:
8234
case glslang::EOpSubgroupInclusiveMul:
8235
case glslang::EOpSubgroupInclusiveMin:
8236
case glslang::EOpSubgroupInclusiveMax:
8237
case glslang::EOpSubgroupInclusiveAnd:
8238
case glslang::EOpSubgroupInclusiveOr:
8239
case glslang::EOpSubgroupInclusiveXor:
8240
case glslang::EOpSubgroupExclusiveAdd:
8241
case glslang::EOpSubgroupExclusiveMul:
8242
case glslang::EOpSubgroupExclusiveMin:
8243
case glslang::EOpSubgroupExclusiveMax:
8244
case glslang::EOpSubgroupExclusiveAnd:
8245
case glslang::EOpSubgroupExclusiveOr:
8246
case glslang::EOpSubgroupExclusiveXor:
8247
case glslang::EOpSubgroupQuadSwapHorizontal:
8248
case glslang::EOpSubgroupQuadSwapVertical:
8249
case glslang::EOpSubgroupQuadSwapDiagonal:
8250
case glslang::EOpSubgroupQuadAll:
8251
case glslang::EOpSubgroupQuadAny: {
8252
std::vector<spv::Id> operands;
8253
operands.push_back(operand);
8254
return createSubgroupOperation(op, typeId, operands, typeProxy);
8255
}
8256
case glslang::EOpMbcnt:
8257
extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_ballot);
8258
libCall = spv::MbcntAMD;
8259
break;
8260
8261
case glslang::EOpCubeFaceIndex:
8262
extBuiltins = getExtBuiltins(spv::E_SPV_AMD_gcn_shader);
8263
libCall = spv::CubeFaceIndexAMD;
8264
break;
8265
8266
case glslang::EOpCubeFaceCoord:
8267
extBuiltins = getExtBuiltins(spv::E_SPV_AMD_gcn_shader);
8268
libCall = spv::CubeFaceCoordAMD;
8269
break;
8270
case glslang::EOpSubgroupPartition:
8271
unaryOp = spv::Op::OpGroupNonUniformPartitionNV;
8272
break;
8273
case glslang::EOpConstructReference:
8274
unaryOp = spv::Op::OpBitcast;
8275
break;
8276
8277
case glslang::EOpConvUint64ToAccStruct:
8278
case glslang::EOpConvUvec2ToAccStruct:
8279
unaryOp = spv::Op::OpConvertUToAccelerationStructureKHR;
8280
break;
8281
8282
case glslang::EOpHitObjectIsEmptyNV:
8283
unaryOp = spv::Op::OpHitObjectIsEmptyNV;
8284
break;
8285
8286
case glslang::EOpHitObjectIsEmptyEXT:
8287
unaryOp = spv::Op::OpHitObjectIsEmptyEXT;
8288
break;
8289
8290
case glslang::EOpHitObjectIsMissNV:
8291
unaryOp = spv::Op::OpHitObjectIsMissNV;
8292
break;
8293
8294
case glslang::EOpHitObjectIsMissEXT:
8295
unaryOp = spv::Op::OpHitObjectIsMissEXT;
8296
break;
8297
8298
case glslang::EOpHitObjectIsHitNV:
8299
unaryOp = spv::Op::OpHitObjectIsHitNV;
8300
break;
8301
8302
case glslang::EOpHitObjectIsHitEXT:
8303
unaryOp = spv::Op::OpHitObjectIsHitEXT;
8304
break;
8305
8306
case glslang::EOpHitObjectGetObjectRayOriginNV:
8307
unaryOp = spv::Op::OpHitObjectGetObjectRayOriginNV;
8308
break;
8309
8310
case glslang::EOpHitObjectGetObjectRayOriginEXT:
8311
unaryOp = spv::Op::OpHitObjectGetObjectRayOriginEXT;
8312
break;
8313
8314
case glslang::EOpHitObjectGetObjectRayDirectionNV:
8315
unaryOp = spv::Op::OpHitObjectGetObjectRayDirectionNV;
8316
break;
8317
8318
case glslang::EOpHitObjectGetObjectRayDirectionEXT:
8319
unaryOp = spv::Op::OpHitObjectGetObjectRayDirectionEXT;
8320
break;
8321
8322
case glslang::EOpHitObjectGetWorldRayOriginNV:
8323
unaryOp = spv::Op::OpHitObjectGetWorldRayOriginNV;
8324
break;
8325
8326
case glslang::EOpHitObjectGetWorldRayOriginEXT:
8327
unaryOp = spv::Op::OpHitObjectGetWorldRayOriginEXT;
8328
break;
8329
8330
case glslang::EOpHitObjectGetWorldRayDirectionNV:
8331
unaryOp = spv::Op::OpHitObjectGetWorldRayDirectionNV;
8332
break;
8333
8334
case glslang::EOpHitObjectGetWorldRayDirectionEXT:
8335
unaryOp = spv::Op::OpHitObjectGetWorldRayDirectionEXT;
8336
break;
8337
8338
case glslang::EOpHitObjectGetObjectToWorldNV:
8339
unaryOp = spv::Op::OpHitObjectGetObjectToWorldNV;
8340
break;
8341
8342
case glslang::EOpHitObjectGetObjectToWorldEXT:
8343
unaryOp = spv::Op::OpHitObjectGetObjectToWorldEXT;
8344
break;
8345
8346
case glslang::EOpHitObjectGetWorldToObjectNV:
8347
unaryOp = spv::Op::OpHitObjectGetWorldToObjectNV;
8348
break;
8349
8350
case glslang::EOpHitObjectGetWorldToObjectEXT:
8351
unaryOp = spv::Op::OpHitObjectGetWorldToObjectEXT;
8352
break;
8353
8354
case glslang::EOpHitObjectGetRayTMinNV:
8355
unaryOp = spv::Op::OpHitObjectGetRayTMinNV;
8356
break;
8357
8358
case glslang::EOpHitObjectGetRayTMinEXT:
8359
unaryOp = spv::Op::OpHitObjectGetRayTMinEXT;
8360
break;
8361
8362
case glslang::EOpHitObjectGetRayTMaxNV:
8363
unaryOp = spv::Op::OpHitObjectGetRayTMaxNV;
8364
break;
8365
8366
case glslang::EOpHitObjectGetRayTMaxEXT:
8367
unaryOp = spv::Op::OpHitObjectGetRayTMaxEXT;
8368
break;
8369
8370
case glslang::EOpHitObjectGetRayFlagsEXT:
8371
unaryOp = spv::Op::OpHitObjectGetRayFlagsEXT;
8372
break;
8373
8374
case glslang::EOpHitObjectGetPrimitiveIndexNV:
8375
unaryOp = spv::Op::OpHitObjectGetPrimitiveIndexNV;
8376
break;
8377
8378
case glslang::EOpHitObjectGetPrimitiveIndexEXT:
8379
unaryOp = spv::Op::OpHitObjectGetPrimitiveIndexEXT;
8380
break;
8381
8382
case glslang::EOpHitObjectGetInstanceIdNV:
8383
unaryOp = spv::Op::OpHitObjectGetInstanceIdNV;
8384
break;
8385
8386
case glslang::EOpHitObjectGetInstanceIdEXT:
8387
unaryOp = spv::Op::OpHitObjectGetInstanceIdEXT;
8388
break;
8389
8390
case glslang::EOpHitObjectGetInstanceCustomIndexNV:
8391
unaryOp = spv::Op::OpHitObjectGetInstanceCustomIndexNV;
8392
break;
8393
8394
case glslang::EOpHitObjectGetInstanceCustomIndexEXT:
8395
unaryOp = spv::Op::OpHitObjectGetInstanceCustomIndexEXT;
8396
break;
8397
8398
case glslang::EOpHitObjectGetGeometryIndexNV:
8399
unaryOp = spv::Op::OpHitObjectGetGeometryIndexNV;
8400
break;
8401
8402
case glslang::EOpHitObjectGetGeometryIndexEXT:
8403
unaryOp = spv::Op::OpHitObjectGetGeometryIndexEXT;
8404
break;
8405
8406
case glslang::EOpHitObjectGetHitKindNV:
8407
unaryOp = spv::Op::OpHitObjectGetHitKindNV;
8408
break;
8409
8410
case glslang::EOpHitObjectGetHitKindEXT:
8411
unaryOp = spv::Op::OpHitObjectGetHitKindEXT;
8412
break;
8413
8414
case glslang::EOpHitObjectGetCurrentTimeNV:
8415
unaryOp = spv::Op::OpHitObjectGetCurrentTimeNV;
8416
break;
8417
8418
case glslang::EOpHitObjectGetCurrentTimeEXT:
8419
unaryOp = spv::Op::OpHitObjectGetCurrentTimeEXT;
8420
break;
8421
8422
case glslang::EOpHitObjectGetShaderBindingTableRecordIndexNV:
8423
unaryOp = spv::Op::OpHitObjectGetShaderBindingTableRecordIndexNV;
8424
break;
8425
8426
case glslang::EOpHitObjectGetShaderBindingTableRecordIndexEXT:
8427
unaryOp = spv::Op::OpHitObjectGetShaderBindingTableRecordIndexEXT;
8428
break;
8429
8430
case glslang::EOpHitObjectGetShaderRecordBufferHandleNV:
8431
unaryOp = spv::Op::OpHitObjectGetShaderRecordBufferHandleNV;
8432
break;
8433
8434
case glslang::EOpHitObjectGetClusterIdNV:
8435
unaryOp = spv::Op::OpHitObjectGetClusterIdNV;
8436
builder.addExtension(spv::E_SPV_NV_cluster_acceleration_structure);
8437
builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
8438
builder.addCapability(spv::Capability::RayTracingClusterAccelerationStructureNV);
8439
break;
8440
8441
case glslang::EOpHitObjectGetSpherePositionNV:
8442
unaryOp = spv::Op::OpHitObjectGetSpherePositionNV;
8443
builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
8444
builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
8445
builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);
8446
break;
8447
8448
case glslang::EOpHitObjectGetSphereRadiusNV:
8449
unaryOp = spv::Op::OpHitObjectGetSphereRadiusNV;
8450
builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
8451
builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
8452
builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);
8453
break;
8454
8455
case glslang::EOpHitObjectIsSphereHitNV:
8456
unaryOp = spv::Op::OpHitObjectIsSphereHitNV;
8457
builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
8458
builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
8459
builder.addCapability(spv::Capability::RayTracingSpheresGeometryNV);
8460
break;
8461
8462
case glslang::EOpHitObjectIsLSSHitNV:
8463
unaryOp = spv::Op::OpHitObjectIsLSSHitNV;
8464
builder.addExtension(spv::E_SPV_NV_linear_swept_spheres);
8465
builder.addCapability(spv::Capability::ShaderInvocationReorderNV);
8466
builder.addCapability(spv::Capability::RayTracingLinearSweptSpheresGeometryNV);
8467
break;
8468
8469
case glslang::EOpHitObjectGetShaderRecordBufferHandleEXT:
8470
unaryOp = spv::Op::OpHitObjectGetShaderRecordBufferHandleEXT;
8471
break;
8472
8473
case glslang::EOpFetchMicroTriangleVertexPositionNV:
8474
unaryOp = spv::Op::OpFetchMicroTriangleVertexPositionNV;
8475
break;
8476
8477
case glslang::EOpFetchMicroTriangleVertexBarycentricNV:
8478
unaryOp = spv::Op::OpFetchMicroTriangleVertexBarycentricNV;
8479
break;
8480
8481
case glslang::EOpCopyObject:
8482
unaryOp = spv::Op::OpCopyObject;
8483
break;
8484
8485
case glslang::EOpDepthAttachmentReadEXT:
8486
builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
8487
builder.addCapability(spv::Capability::TileImageDepthReadAccessEXT);
8488
unaryOp = spv::Op::OpDepthAttachmentReadEXT;
8489
decorations.precision = spv::NoPrecision;
8490
break;
8491
case glslang::EOpStencilAttachmentReadEXT:
8492
builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
8493
builder.addCapability(spv::Capability::TileImageStencilReadAccessEXT);
8494
unaryOp = spv::Op::OpStencilAttachmentReadEXT;
8495
decorations.precision = spv::Decoration::RelaxedPrecision;
8496
break;
8497
8498
default:
8499
return 0;
8500
}
8501
8502
spv::Id id;
8503
if (libCall >= 0) {
8504
std::vector<spv::Id> args;
8505
args.push_back(operand);
8506
id = builder.createBuiltinCall(typeId, extBuiltins >= 0 ? extBuiltins : stdBuiltins, libCall, args);
8507
} else {
8508
id = builder.createUnaryOp(unaryOp, typeId, operand);
8509
}
8510
8511
decorations.addNoContraction(builder, id);
8512
decorations.addNonUniform(builder, id);
8513
return builder.setPrecision(id, decorations.precision);
8514
}
8515
8516
// Create a unary operation on a matrix
8517
spv::Id TGlslangToSpvTraverser::createUnaryMatrixOperation(spv::Op op, OpDecorations& decorations, spv::Id typeId,
8518
spv::Id operand, glslang::TBasicType /* typeProxy */)
8519
{
8520
// Handle unary operations vector by vector.
8521
// The result type is the same type as the original type.
8522
// The algorithm is to:
8523
// - break the matrix into vectors
8524
// - apply the operation to each vector
8525
// - make a matrix out the vector results
8526
8527
// get the types sorted out
8528
int numCols = builder.getNumColumns(operand);
8529
int numRows = builder.getNumRows(operand);
8530
spv::Id srcVecType = builder.makeVectorType(builder.getScalarTypeId(builder.getTypeId(operand)), numRows);
8531
spv::Id destVecType = builder.makeVectorType(builder.getScalarTypeId(typeId), numRows);
8532
std::vector<spv::Id> results;
8533
8534
// do each vector op
8535
for (int c = 0; c < numCols; ++c) {
8536
std::vector<unsigned int> indexes;
8537
indexes.push_back(c);
8538
spv::Id srcVec = builder.createCompositeExtract(operand, srcVecType, indexes);
8539
spv::Id destVec = builder.createUnaryOp(op, destVecType, srcVec);
8540
decorations.addNoContraction(builder, destVec);
8541
decorations.addNonUniform(builder, destVec);
8542
results.push_back(builder.setPrecision(destVec, decorations.precision));
8543
}
8544
8545
// put the pieces together
8546
spv::Id result = builder.setPrecision(builder.createCompositeConstruct(typeId, results), decorations.precision);
8547
decorations.addNonUniform(builder, result);
8548
return result;
8549
}
8550
8551
// For converting integers where both the bitwidth and the signedness could
8552
// change, but only do the width change here. The caller is still responsible
8553
// for the signedness conversion.
8554
// destType is the final type that will be converted to, but this function
8555
// may only be doing part of that conversion.
8556
spv::Id TGlslangToSpvTraverser::createIntWidthConversion(spv::Id operand, int vectorSize, spv::Id destType,
8557
glslang::TBasicType resultBasicType, glslang::TBasicType operandBasicType)
8558
{
8559
// Get the result type width, based on the type to convert to.
8560
int width = GetNumBits(resultBasicType);
8561
8562
// Get the conversion operation and result type,
8563
// based on the target width, but the source type.
8564
spv::Id type = spv::NoType;
8565
spv::Op convOp = spv::Op::OpNop;
8566
if (isTypeSignedInt(operandBasicType)) {
8567
convOp = spv::Op::OpSConvert;
8568
type = builder.makeIntType(width);
8569
} else {
8570
convOp = spv::Op::OpUConvert;
8571
type = builder.makeUintType(width);
8572
}
8573
8574
if (builder.getOpCode(destType) == spv::Op::OpTypeCooperativeVectorNV) {
8575
type = builder.makeCooperativeVectorTypeNV(type, builder.getCooperativeVectorNumComponents(destType));
8576
} else if (vectorSize > 0)
8577
type = builder.makeVectorType(type, vectorSize);
8578
else if (builder.getOpCode(destType) == spv::Op::OpTypeCooperativeMatrixKHR ||
8579
builder.getOpCode(destType) == spv::Op::OpTypeCooperativeMatrixNV) {
8580
8581
type = builder.makeCooperativeMatrixTypeWithSameShape(type, destType);
8582
}
8583
8584
return builder.createUnaryOp(convOp, type, operand);
8585
}
8586
8587
// Emit the SPIR-V for a glslang conversion operator.
//
// For numeric conversions (and EOpConstructSaturated) the instruction is chosen
// from the operand/result basic types:
//  - int <-> float and same-signedness int or float width changes map to a single convert op,
//  - a signedness change is an optional width conversion followed by OpBitcast
//    (or OpIAdd with zero while generating spec-constant code),
//  - anything -> bool is a "not equal to zero" comparison,
//  - bool -> anything is an OpSelect between one and zero.
// Pointer/uint64/uvec2 conversions are handled by operator afterwards.
//
// Returns 0 when 'op' is not a conversion handled here.
spv::Id TGlslangToSpvTraverser::createConversion(glslang::TOperator op, OpDecorations& decorations, spv::Id destType,
                                                 spv::Id operand, glslang::TBasicType resultBasicType,
                                                 glslang::TBasicType operandBasicType)
{
    // Scalar integer constant of type 'intType'; 64-bit values use the 64-bit builder entry point.
    const auto makeIntOfWidth = [this](spv::Id intType, uint32_t bits, unsigned value) -> spv::Id {
        return bits == 64 ? builder.makeInt64Constant(intType, value, false)
                          : builder.makeIntConstant(intType, value, false);
    };

    // Scalar floating-point constant of the given width (64, 32 or 16 bits).
    const auto makeFloatOfWidth = [this](uint32_t bits, double value) -> spv::Id {
        if (bits == 64)
            return builder.makeDoubleConstant(value);
        if (bits == 32)
            return builder.makeFloatConstant(static_cast<float>(value));
        assert(bits == 16);
        return builder.makeFloat16Constant(static_cast<float>(value));
    };

    spv::Op opcode = spv::Op::OpNop;
    spv::Id falseValue = 0;
    spv::Id trueValue = 0;

    // 0 means "not a vector"; constants are only smeared for vector destinations.
    const int componentCount = builder.isVectorType(destType) ? builder.getNumTypeComponents(destType) : 0;

    if (IsOpNumericConv(op) || op == glslang::EOpConstructSaturated) {
        const bool fromSigned = isTypeSignedInt(operandBasicType);
        const bool fromUnsigned = isTypeUnsignedInt(operandBasicType);
        const bool fromFloat = isTypeFloat(operandBasicType);
        const bool toSigned = isTypeSignedInt(resultBasicType);
        const bool toUnsigned = isTypeUnsignedInt(resultBasicType);
        const bool toFloat = isTypeFloat(resultBasicType);

        // integer -> float
        if (toFloat) {
            if (fromSigned)
                opcode = spv::Op::OpConvertSToF;
            if (fromUnsigned)
                opcode = spv::Op::OpConvertUToF;
        }

        // float -> integer
        if (fromFloat) {
            if (toSigned)
                opcode = spv::Op::OpConvertFToS;
            if (toUnsigned)
                opcode = spv::Op::OpConvertFToU;
        }

        // same-signedness integer width changes
        if (fromSigned && toSigned)
            opcode = spv::Op::OpSConvert;
        if (fromUnsigned && toUnsigned)
            opcode = spv::Op::OpUConvert;

        // float width changes; matrices are converted column by column
        if (fromFloat && toFloat) {
            opcode = spv::Op::OpFConvert;
            if (builder.isMatrixType(destType))
                return createUnaryMatrixOperation(opcode, decorations, destType, operand, operandBasicType);
        }

        // integer conversions that flip signedness
        if (isTypeInt(operandBasicType) && isTypeInt(resultBasicType) && fromUnsigned != toUnsigned) {
            // Adjust the width first (OpSConvert/OpUConvert); the sign change follows.
            if (GetNumBits(operandBasicType) != GetNumBits(resultBasicType))
                operand = createIntWidthConversion(operand, componentCount, destType, resultBasicType,
                                                   operandBasicType);

            if (builder.isInSpecConstCodeGenMode()) {
                // When generating for an OpSpecConstantOp instruction, add zero with
                // OpIAdd instead of using OpBitcast to do the conversion.
                const uint32_t resultBits = GetNumBits(resultBasicType);
                const spv::Id unsignedType = builder.makeUintType(resultBits);
                const spv::Id scalarZero = makeIntOfWidth(unsignedType, resultBits, 0);
                const spv::Id addend = makeSmearedConstant(scalarZero, componentCount);
                return builder.createBinOp(spv::Op::OpIAdd, destType, operand, addend);
            }

            // Ordinary run-time conversion: reinterpret the bits.
            opcode = spv::Op::OpBitcast;
        }

        // number -> bool: compare against zero
        if (resultBasicType == glslang::EbtBool) {
            const uint32_t operandBits = GetNumBits(operandBasicType);
            if (isTypeInt(operandBasicType)) {
                const spv::Id unsignedType = builder.makeUintType(operandBits);
                const spv::Id scalarZero = makeIntOfWidth(unsignedType, operandBits, 0);
                const spv::Id comparand = makeSmearedConstant(scalarZero, componentCount);
                return builder.createBinOp(spv::Op::OpINotEqual, destType, operand, comparand);
            }

            assert(isTypeFloat(operandBasicType));
            const spv::Id scalarZero = makeFloatOfWidth(operandBits, 0.0);
            const spv::Id comparand = makeSmearedConstant(scalarZero, componentCount);
            return builder.createBinOp(spv::Op::OpFUnordNotEqual, destType, operand, comparand);
        }

        // bool -> number: select between one and zero of the result type
        if (operandBasicType == glslang::EbtBool) {
            const uint32_t resultBits = GetNumBits(resultBasicType);
            opcode = spv::Op::OpSelect;
            if (isTypeInt(resultBasicType)) {
                const spv::Id integerType = toSigned ? builder.makeIntType(resultBits)
                                                     : builder.makeUintType(resultBits);
                falseValue = makeIntOfWidth(integerType, resultBits, 0);
                trueValue = makeIntOfWidth(integerType, resultBits, 1);
            } else {
                assert(isTypeFloat(resultBasicType));
                falseValue = makeFloatOfWidth(resultBits, 0.0);
                trueValue = makeFloatOfWidth(resultBits, 1.0);
            }
        }
    }

    // Nothing chosen from the basic types: fall back to the operator itself.
    if (opcode == spv::Op::OpNop) {
        if (op == glslang::EOpConvUint64ToPtr)
            opcode = spv::Op::OpConvertUToPtr;
        else if (op == glslang::EOpConvPtrToUint64)
            opcode = spv::Op::OpConvertPtrToU;
        else if (op == glslang::EOpConvPtrToUvec2 || op == glslang::EOpConvUvec2ToPtr)
            opcode = spv::Op::OpBitcast;
        else
            return 0; // not a conversion handled here
    }

    spv::Id converted = 0;
    if (opcode == spv::Op::OpSelect) {
        falseValue = makeSmearedConstant(falseValue, componentCount);
        trueValue = makeSmearedConstant(trueValue, componentCount);
        converted = builder.createTriOp(opcode, destType, operand, trueValue, falseValue);
    } else {
        converted = builder.createUnaryOp(opcode, destType, operand);
    }

    converted = builder.setPrecision(converted, decorations.precision);
    decorations.addNonUniform(builder, converted);
    return converted;
}
8731
8732
// Replicate a scalar constant across every component of a vector constant.
// A 'vectorSize' of 0 means the destination is not a vector, in which case the
// scalar constant is returned unchanged.
spv::Id TGlslangToSpvTraverser::makeSmearedConstant(spv::Id constant, int vectorSize)
{
    if (vectorSize == 0)
        return constant;

    const spv::Id scalarType = builder.getTypeId(constant);
    const spv::Id smearedType = builder.makeVectorType(scalarType, vectorSize);

    // One copy of the scalar per component.
    std::vector<spv::Id> lanes;
    if (vectorSize > 0)
        lanes.assign(static_cast<std::vector<spv::Id>::size_type>(vectorSize), constant);

    return builder.makeCompositeConstant(smearedType, lanes);
}
8743
8744
// For glslang ops that map to SPV atomic opCodes
8745
spv::Id TGlslangToSpvTraverser::createAtomicOperation(glslang::TOperator op, spv::Decoration /*precision*/,
8746
spv::Id typeId, std::vector<spv::Id>& operands, glslang::TBasicType typeProxy,
8747
const spv::Builder::AccessChain::CoherentFlags &lvalueCoherentFlags, const glslang::TType &opType)
8748
{
8749
spv::Op opCode = spv::Op::OpNop;
8750
8751
switch (op) {
8752
case glslang::EOpAtomicAdd:
8753
case glslang::EOpImageAtomicAdd:
8754
case glslang::EOpAtomicCounterAdd:
8755
opCode = spv::Op::OpAtomicIAdd;
8756
if (typeProxy == glslang::EbtFloat16 || typeProxy == glslang::EbtFloat || typeProxy == glslang::EbtDouble) {
8757
opCode = spv::Op::OpAtomicFAddEXT;
8758
if (typeProxy == glslang::EbtFloat16 &&
8759
(opType.getVectorSize() == 2 || opType.getVectorSize() == 4)) {
8760
builder.addExtension(spv::E_SPV_NV_shader_atomic_fp16_vector);
8761
builder.addCapability(spv::Capability::AtomicFloat16VectorNV);
8762
} else {
8763
builder.addExtension(spv::E_SPV_EXT_shader_atomic_float_add);
8764
if (typeProxy == glslang::EbtFloat16) {
8765
builder.addExtension(spv::E_SPV_EXT_shader_atomic_float16_add);
8766
builder.addCapability(spv::Capability::AtomicFloat16AddEXT);
8767
} else if (typeProxy == glslang::EbtFloat) {
8768
builder.addCapability(spv::Capability::AtomicFloat32AddEXT);
8769
} else {
8770
builder.addCapability(spv::Capability::AtomicFloat64AddEXT);
8771
}
8772
}
8773
}
8774
break;
8775
case glslang::EOpAtomicSubtract:
8776
case glslang::EOpAtomicCounterSubtract:
8777
opCode = spv::Op::OpAtomicISub;
8778
break;
8779
case glslang::EOpAtomicMin:
8780
case glslang::EOpImageAtomicMin:
8781
case glslang::EOpAtomicCounterMin:
8782
if (typeProxy == glslang::EbtFloat16 || typeProxy == glslang::EbtFloat || typeProxy == glslang::EbtDouble) {
8783
opCode = spv::Op::OpAtomicFMinEXT;
8784
if (typeProxy == glslang::EbtFloat16 &&
8785
(opType.getVectorSize() == 2 || opType.getVectorSize() == 4)) {
8786
builder.addExtension(spv::E_SPV_NV_shader_atomic_fp16_vector);
8787
builder.addCapability(spv::Capability::AtomicFloat16VectorNV);
8788
} else {
8789
builder.addExtension(spv::E_SPV_EXT_shader_atomic_float_min_max);
8790
if (typeProxy == glslang::EbtFloat16)
8791
builder.addCapability(spv::Capability::AtomicFloat16MinMaxEXT);
8792
else if (typeProxy == glslang::EbtFloat)
8793
builder.addCapability(spv::Capability::AtomicFloat32MinMaxEXT);
8794
else
8795
builder.addCapability(spv::Capability::AtomicFloat64MinMaxEXT);
8796
}
8797
} else if (typeProxy == glslang::EbtUint || typeProxy == glslang::EbtUint64) {
8798
opCode = spv::Op::OpAtomicUMin;
8799
} else {
8800
opCode = spv::Op::OpAtomicSMin;
8801
}
8802
break;
8803
case glslang::EOpAtomicMax:
8804
case glslang::EOpImageAtomicMax:
8805
case glslang::EOpAtomicCounterMax:
8806
if (typeProxy == glslang::EbtFloat16 || typeProxy == glslang::EbtFloat || typeProxy == glslang::EbtDouble) {
8807
opCode = spv::Op::OpAtomicFMaxEXT;
8808
if (typeProxy == glslang::EbtFloat16 &&
8809
(opType.getVectorSize() == 2 || opType.getVectorSize() == 4)) {
8810
builder.addExtension(spv::E_SPV_NV_shader_atomic_fp16_vector);
8811
builder.addCapability(spv::Capability::AtomicFloat16VectorNV);
8812
} else {
8813
builder.addExtension(spv::E_SPV_EXT_shader_atomic_float_min_max);
8814
if (typeProxy == glslang::EbtFloat16)
8815
builder.addCapability(spv::Capability::AtomicFloat16MinMaxEXT);
8816
else if (typeProxy == glslang::EbtFloat)
8817
builder.addCapability(spv::Capability::AtomicFloat32MinMaxEXT);
8818
else
8819
builder.addCapability(spv::Capability::AtomicFloat64MinMaxEXT);
8820
}
8821
} else if (typeProxy == glslang::EbtUint || typeProxy == glslang::EbtUint64) {
8822
opCode = spv::Op::OpAtomicUMax;
8823
} else {
8824
opCode = spv::Op::OpAtomicSMax;
8825
}
8826
break;
8827
case glslang::EOpAtomicAnd:
8828
case glslang::EOpImageAtomicAnd:
8829
case glslang::EOpAtomicCounterAnd:
8830
opCode = spv::Op::OpAtomicAnd;
8831
break;
8832
case glslang::EOpAtomicOr:
8833
case glslang::EOpImageAtomicOr:
8834
case glslang::EOpAtomicCounterOr:
8835
opCode = spv::Op::OpAtomicOr;
8836
break;
8837
case glslang::EOpAtomicXor:
8838
case glslang::EOpImageAtomicXor:
8839
case glslang::EOpAtomicCounterXor:
8840
opCode = spv::Op::OpAtomicXor;
8841
break;
8842
case glslang::EOpAtomicExchange:
8843
case glslang::EOpImageAtomicExchange:
8844
case glslang::EOpAtomicCounterExchange:
8845
if ((typeProxy == glslang::EbtFloat16) &&
8846
(opType.getVectorSize() == 2 || opType.getVectorSize() == 4)) {
8847
builder.addExtension(spv::E_SPV_NV_shader_atomic_fp16_vector);
8848
builder.addCapability(spv::Capability::AtomicFloat16VectorNV);
8849
}
8850
8851
opCode = spv::Op::OpAtomicExchange;
8852
break;
8853
case glslang::EOpAtomicCompSwap:
8854
case glslang::EOpImageAtomicCompSwap:
8855
case glslang::EOpAtomicCounterCompSwap:
8856
opCode = spv::Op::OpAtomicCompareExchange;
8857
break;
8858
case glslang::EOpAtomicCounterIncrement:
8859
opCode = spv::Op::OpAtomicIIncrement;
8860
break;
8861
case glslang::EOpAtomicCounterDecrement:
8862
opCode = spv::Op::OpAtomicIDecrement;
8863
break;
8864
case glslang::EOpAtomicCounter:
8865
case glslang::EOpImageAtomicLoad:
8866
case glslang::EOpAtomicLoad:
8867
opCode = spv::Op::OpAtomicLoad;
8868
break;
8869
case glslang::EOpAtomicStore:
8870
case glslang::EOpImageAtomicStore:
8871
opCode = spv::Op::OpAtomicStore;
8872
break;
8873
default:
8874
assert(0);
8875
break;
8876
}
8877
8878
if (typeProxy == glslang::EbtInt64 || typeProxy == glslang::EbtUint64)
8879
builder.addCapability(spv::Capability::Int64Atomics);
8880
8881
// Sort out the operands
8882
// - mapping from glslang -> SPV
8883
// - there are extra SPV operands that are optional in glslang
8884
// - compare-exchange swaps the value and comparator
8885
// - compare-exchange has an extra memory semantics
8886
// - EOpAtomicCounterDecrement needs a post decrement
8887
spv::Id pointerId = 0, compareId = 0, valueId = 0;
8888
// scope defaults to Device in the old model, QueueFamilyKHR in the new model
8889
spv::Id scopeId;
8890
if (glslangIntermediate->usingVulkanMemoryModel()) {
8891
scopeId = builder.makeUintConstant(spv::Scope::QueueFamilyKHR);
8892
} else {
8893
scopeId = builder.makeUintConstant(spv::Scope::Device);
8894
}
8895
// semantics default to relaxed
8896
spv::Id semanticsId = builder.makeUintConstant(lvalueCoherentFlags.isVolatile() &&
8897
glslangIntermediate->usingVulkanMemoryModel() ?
8898
spv::MemorySemanticsMask::Volatile :
8899
spv::MemorySemanticsMask::MaskNone);
8900
spv::Id semanticsId2 = semanticsId;
8901
8902
pointerId = operands[0];
8903
if (opCode == spv::Op::OpAtomicIIncrement || opCode == spv::Op::OpAtomicIDecrement) {
8904
// no additional operands
8905
} else if (opCode == spv::Op::OpAtomicCompareExchange) {
8906
compareId = operands[1];
8907
valueId = operands[2];
8908
if (operands.size() > 3) {
8909
scopeId = operands[3];
8910
semanticsId = builder.makeUintConstant(
8911
builder.getConstantScalar(operands[4]) | builder.getConstantScalar(operands[5]));
8912
semanticsId2 = builder.makeUintConstant(
8913
builder.getConstantScalar(operands[6]) | builder.getConstantScalar(operands[7]));
8914
}
8915
} else if (opCode == spv::Op::OpAtomicLoad) {
8916
if (operands.size() > 1) {
8917
scopeId = operands[1];
8918
semanticsId = builder.makeUintConstant(
8919
builder.getConstantScalar(operands[2]) | builder.getConstantScalar(operands[3]));
8920
}
8921
} else {
8922
// atomic store or RMW
8923
valueId = operands[1];
8924
if (operands.size() > 2) {
8925
scopeId = operands[2];
8926
semanticsId = builder.makeUintConstant
8927
(builder.getConstantScalar(operands[3]) | builder.getConstantScalar(operands[4]));
8928
}
8929
}
8930
8931
// Check for capabilities
8932
auto const semanticsImmediate = (spv::MemorySemanticsMask)(builder.getConstantScalar(semanticsId) | builder.getConstantScalar(semanticsId2));
8933
if (anySet(semanticsImmediate, spv::MemorySemanticsMask::MakeAvailableKHR |
8934
spv::MemorySemanticsMask::MakeVisibleKHR |
8935
spv::MemorySemanticsMask::OutputMemoryKHR |
8936
spv::MemorySemanticsMask::Volatile)) {
8937
builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
8938
}
8939
8940
auto const scope = (spv::Scope)builder.getConstantScalar(scopeId);
8941
if (scope == spv::Scope::QueueFamily) {
8942
builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
8943
}
8944
8945
if (glslangIntermediate->usingVulkanMemoryModel() && scope == spv::Scope::Device) {
8946
builder.addCapability(spv::Capability::VulkanMemoryModelDeviceScopeKHR);
8947
}
8948
8949
std::vector<spv::Id> spvAtomicOperands; // hold the spv operands
8950
spvAtomicOperands.reserve(6);
8951
spvAtomicOperands.push_back(pointerId);
8952
spvAtomicOperands.push_back(scopeId);
8953
spvAtomicOperands.push_back(semanticsId);
8954
if (opCode == spv::Op::OpAtomicCompareExchange) {
8955
spvAtomicOperands.push_back(semanticsId2);
8956
spvAtomicOperands.push_back(valueId);
8957
spvAtomicOperands.push_back(compareId);
8958
} else if (opCode != spv::Op::OpAtomicLoad && opCode != spv::Op::OpAtomicIIncrement && opCode != spv::Op::OpAtomicIDecrement) {
8959
spvAtomicOperands.push_back(valueId);
8960
}
8961
8962
if (opCode == spv::Op::OpAtomicStore) {
8963
builder.createNoResultOp(opCode, spvAtomicOperands);
8964
return 0;
8965
} else {
8966
spv::Id resultId = builder.createOp(opCode, typeId, spvAtomicOperands);
8967
8968
// GLSL and HLSL atomic-counter decrement return post-decrement value,
8969
// while SPIR-V returns pre-decrement value. Translate between these semantics.
8970
if (op == glslang::EOpAtomicCounterDecrement)
8971
resultId = builder.createBinOp(spv::Op::OpISub, typeId, resultId, builder.makeIntConstant(1));
8972
8973
return resultId;
8974
}
8975
}
8976
8977
// Create group invocation operations.
8978
spv::Id TGlslangToSpvTraverser::createInvocationsOperation(glslang::TOperator op, spv::Id typeId,
8979
std::vector<spv::Id>& operands, glslang::TBasicType typeProxy)
8980
{
8981
bool isUnsigned = isTypeUnsignedInt(typeProxy);
8982
bool isFloat = isTypeFloat(typeProxy);
8983
8984
spv::Op opCode = spv::Op::OpNop;
8985
std::vector<spv::IdImmediate> spvGroupOperands;
8986
spv::GroupOperation groupOperation = spv::GroupOperation::Max;
8987
8988
if (op == glslang::EOpBallot || op == glslang::EOpReadFirstInvocation ||
8989
op == glslang::EOpReadInvocation) {
8990
builder.addExtension(spv::E_SPV_KHR_shader_ballot);
8991
builder.addCapability(spv::Capability::SubgroupBallotKHR);
8992
} else if (op == glslang::EOpAnyInvocation ||
8993
op == glslang::EOpAllInvocations ||
8994
op == glslang::EOpAllInvocationsEqual) {
8995
builder.addExtension(spv::E_SPV_KHR_subgroup_vote);
8996
builder.addCapability(spv::Capability::SubgroupVoteKHR);
8997
} else {
8998
builder.addCapability(spv::Capability::Groups);
8999
if (op == glslang::EOpMinInvocationsNonUniform ||
9000
op == glslang::EOpMaxInvocationsNonUniform ||
9001
op == glslang::EOpAddInvocationsNonUniform ||
9002
op == glslang::EOpMinInvocationsInclusiveScanNonUniform ||
9003
op == glslang::EOpMaxInvocationsInclusiveScanNonUniform ||
9004
op == glslang::EOpAddInvocationsInclusiveScanNonUniform ||
9005
op == glslang::EOpMinInvocationsExclusiveScanNonUniform ||
9006
op == glslang::EOpMaxInvocationsExclusiveScanNonUniform ||
9007
op == glslang::EOpAddInvocationsExclusiveScanNonUniform)
9008
builder.addExtension(spv::E_SPV_AMD_shader_ballot);
9009
9010
switch (op) {
9011
case glslang::EOpMinInvocations:
9012
case glslang::EOpMaxInvocations:
9013
case glslang::EOpAddInvocations:
9014
case glslang::EOpMinInvocationsNonUniform:
9015
case glslang::EOpMaxInvocationsNonUniform:
9016
case glslang::EOpAddInvocationsNonUniform:
9017
groupOperation = spv::GroupOperation::Reduce;
9018
break;
9019
case glslang::EOpMinInvocationsInclusiveScan:
9020
case glslang::EOpMaxInvocationsInclusiveScan:
9021
case glslang::EOpAddInvocationsInclusiveScan:
9022
case glslang::EOpMinInvocationsInclusiveScanNonUniform:
9023
case glslang::EOpMaxInvocationsInclusiveScanNonUniform:
9024
case glslang::EOpAddInvocationsInclusiveScanNonUniform:
9025
groupOperation = spv::GroupOperation::InclusiveScan;
9026
break;
9027
case glslang::EOpMinInvocationsExclusiveScan:
9028
case glslang::EOpMaxInvocationsExclusiveScan:
9029
case glslang::EOpAddInvocationsExclusiveScan:
9030
case glslang::EOpMinInvocationsExclusiveScanNonUniform:
9031
case glslang::EOpMaxInvocationsExclusiveScanNonUniform:
9032
case glslang::EOpAddInvocationsExclusiveScanNonUniform:
9033
groupOperation = spv::GroupOperation::ExclusiveScan;
9034
break;
9035
default:
9036
break;
9037
}
9038
spv::IdImmediate scope = { true, builder.makeUintConstant(spv::Scope::Subgroup) };
9039
spvGroupOperands.push_back(scope);
9040
if (groupOperation != spv::GroupOperation::Max) {
9041
spv::IdImmediate groupOp = { false, (unsigned)groupOperation };
9042
spvGroupOperands.push_back(groupOp);
9043
}
9044
}
9045
9046
for (auto opIt = operands.begin(); opIt != operands.end(); ++opIt) {
9047
spv::IdImmediate op = { true, *opIt };
9048
spvGroupOperands.push_back(op);
9049
}
9050
9051
switch (op) {
9052
case glslang::EOpAnyInvocation:
9053
opCode = spv::Op::OpSubgroupAnyKHR;
9054
break;
9055
case glslang::EOpAllInvocations:
9056
opCode = spv::Op::OpSubgroupAllKHR;
9057
break;
9058
case glslang::EOpAllInvocationsEqual:
9059
opCode = spv::Op::OpSubgroupAllEqualKHR;
9060
break;
9061
case glslang::EOpReadInvocation:
9062
opCode = spv::Op::OpSubgroupReadInvocationKHR;
9063
if (builder.isVectorType(typeId))
9064
return CreateInvocationsVectorOperation(opCode, groupOperation, typeId, operands);
9065
break;
9066
case glslang::EOpReadFirstInvocation:
9067
opCode = spv::Op::OpSubgroupFirstInvocationKHR;
9068
if (builder.isVectorType(typeId))
9069
return CreateInvocationsVectorOperation(opCode, groupOperation, typeId, operands);
9070
break;
9071
case glslang::EOpBallot:
9072
{
9073
// NOTE: According to the spec, the result type of "OpSubgroupBallotKHR" must be a 4 component vector of 32
9074
// bit integer types. The GLSL built-in function "ballotARB()" assumes the maximum number of invocations in
9075
// a subgroup is 64. Thus, we have to convert uvec4.xy to uint64_t as follow:
9076
//
9077
// result = Bitcast(SubgroupBallotKHR(Predicate).xy)
9078
//
9079
spv::Id uintType = builder.makeUintType(32);
9080
spv::Id uvec4Type = builder.makeVectorType(uintType, 4);
9081
spv::Id result = builder.createOp(spv::Op::OpSubgroupBallotKHR, uvec4Type, spvGroupOperands);
9082
9083
std::vector<spv::Id> components;
9084
components.push_back(builder.createCompositeExtract(result, uintType, 0));
9085
components.push_back(builder.createCompositeExtract(result, uintType, 1));
9086
9087
spv::Id uvec2Type = builder.makeVectorType(uintType, 2);
9088
return builder.createUnaryOp(spv::Op::OpBitcast, typeId,
9089
builder.createCompositeConstruct(uvec2Type, components));
9090
}
9091
9092
case glslang::EOpMinInvocations:
9093
case glslang::EOpMaxInvocations:
9094
case glslang::EOpAddInvocations:
9095
case glslang::EOpMinInvocationsInclusiveScan:
9096
case glslang::EOpMaxInvocationsInclusiveScan:
9097
case glslang::EOpAddInvocationsInclusiveScan:
9098
case glslang::EOpMinInvocationsExclusiveScan:
9099
case glslang::EOpMaxInvocationsExclusiveScan:
9100
case glslang::EOpAddInvocationsExclusiveScan:
9101
if (op == glslang::EOpMinInvocations ||
9102
op == glslang::EOpMinInvocationsInclusiveScan ||
9103
op == glslang::EOpMinInvocationsExclusiveScan) {
9104
if (isFloat)
9105
opCode = spv::Op::OpGroupFMin;
9106
else {
9107
if (isUnsigned)
9108
opCode = spv::Op::OpGroupUMin;
9109
else
9110
opCode = spv::Op::OpGroupSMin;
9111
}
9112
} else if (op == glslang::EOpMaxInvocations ||
9113
op == glslang::EOpMaxInvocationsInclusiveScan ||
9114
op == glslang::EOpMaxInvocationsExclusiveScan) {
9115
if (isFloat)
9116
opCode = spv::Op::OpGroupFMax;
9117
else {
9118
if (isUnsigned)
9119
opCode = spv::Op::OpGroupUMax;
9120
else
9121
opCode = spv::Op::OpGroupSMax;
9122
}
9123
} else {
9124
if (isFloat)
9125
opCode = spv::Op::OpGroupFAdd;
9126
else
9127
opCode = spv::Op::OpGroupIAdd;
9128
}
9129
9130
if (builder.isVectorType(typeId))
9131
return CreateInvocationsVectorOperation(opCode, groupOperation, typeId, operands);
9132
9133
break;
9134
case glslang::EOpMinInvocationsNonUniform:
9135
case glslang::EOpMaxInvocationsNonUniform:
9136
case glslang::EOpAddInvocationsNonUniform:
9137
case glslang::EOpMinInvocationsInclusiveScanNonUniform:
9138
case glslang::EOpMaxInvocationsInclusiveScanNonUniform:
9139
case glslang::EOpAddInvocationsInclusiveScanNonUniform:
9140
case glslang::EOpMinInvocationsExclusiveScanNonUniform:
9141
case glslang::EOpMaxInvocationsExclusiveScanNonUniform:
9142
case glslang::EOpAddInvocationsExclusiveScanNonUniform:
9143
if (op == glslang::EOpMinInvocationsNonUniform ||
9144
op == glslang::EOpMinInvocationsInclusiveScanNonUniform ||
9145
op == glslang::EOpMinInvocationsExclusiveScanNonUniform) {
9146
if (isFloat)
9147
opCode = spv::Op::OpGroupFMinNonUniformAMD;
9148
else {
9149
if (isUnsigned)
9150
opCode = spv::Op::OpGroupUMinNonUniformAMD;
9151
else
9152
opCode = spv::Op::OpGroupSMinNonUniformAMD;
9153
}
9154
}
9155
else if (op == glslang::EOpMaxInvocationsNonUniform ||
9156
op == glslang::EOpMaxInvocationsInclusiveScanNonUniform ||
9157
op == glslang::EOpMaxInvocationsExclusiveScanNonUniform) {
9158
if (isFloat)
9159
opCode = spv::Op::OpGroupFMaxNonUniformAMD;
9160
else {
9161
if (isUnsigned)
9162
opCode = spv::Op::OpGroupUMaxNonUniformAMD;
9163
else
9164
opCode = spv::Op::OpGroupSMaxNonUniformAMD;
9165
}
9166
}
9167
else {
9168
if (isFloat)
9169
opCode = spv::Op::OpGroupFAddNonUniformAMD;
9170
else
9171
opCode = spv::Op::OpGroupIAddNonUniformAMD;
9172
}
9173
9174
if (builder.isVectorType(typeId))
9175
return CreateInvocationsVectorOperation(opCode, groupOperation, typeId, operands);
9176
9177
break;
9178
default:
9179
logger->missingFunctionality("invocation operation");
9180
return spv::NoResult;
9181
}
9182
9183
assert(opCode != spv::Op::OpNop);
9184
return builder.createOp(opCode, typeId, spvGroupOperands);
9185
}
9186
9187
// Create group invocation operations on a vector
9188
spv::Id TGlslangToSpvTraverser::CreateInvocationsVectorOperation(spv::Op op, spv::GroupOperation groupOperation,
9189
spv::Id typeId, std::vector<spv::Id>& operands)
9190
{
9191
assert(op == spv::Op::OpGroupFMin || op == spv::Op::OpGroupUMin || op == spv::Op::OpGroupSMin ||
9192
op == spv::Op::OpGroupFMax || op == spv::Op::OpGroupUMax || op == spv::Op::OpGroupSMax ||
9193
op == spv::Op::OpGroupFAdd || op == spv::Op::OpGroupIAdd || op == spv::Op::OpGroupBroadcast ||
9194
op == spv::Op::OpSubgroupReadInvocationKHR || op == spv::Op::OpSubgroupFirstInvocationKHR ||
9195
op == spv::Op::OpGroupFMinNonUniformAMD || op == spv::Op::OpGroupUMinNonUniformAMD ||
9196
op == spv::Op::OpGroupSMinNonUniformAMD ||
9197
op == spv::Op::OpGroupFMaxNonUniformAMD || op == spv::Op::OpGroupUMaxNonUniformAMD ||
9198
op == spv::Op::OpGroupSMaxNonUniformAMD ||
9199
op == spv::Op::OpGroupFAddNonUniformAMD || op == spv::Op::OpGroupIAddNonUniformAMD);
9200
9201
// Handle group invocation operations scalar by scalar.
9202
// The result type is the same type as the original type.
9203
// The algorithm is to:
9204
// - break the vector into scalars
9205
// - apply the operation to each scalar
9206
// - make a vector out the scalar results
9207
9208
// get the types sorted out
9209
int numComponents = builder.getNumComponents(operands[0]);
9210
spv::Id scalarType = builder.getScalarTypeId(builder.getTypeId(operands[0]));
9211
std::vector<spv::Id> results;
9212
9213
// do each scalar op
9214
for (int comp = 0; comp < numComponents; ++comp) {
9215
std::vector<unsigned int> indexes;
9216
indexes.push_back(comp);
9217
spv::IdImmediate scalar = { true, builder.createCompositeExtract(operands[0], scalarType, indexes) };
9218
std::vector<spv::IdImmediate> spvGroupOperands;
9219
if (op == spv::Op::OpSubgroupReadInvocationKHR) {
9220
spvGroupOperands.push_back(scalar);
9221
spv::IdImmediate operand = { true, operands[1] };
9222
spvGroupOperands.push_back(operand);
9223
} else if (op == spv::Op::OpSubgroupFirstInvocationKHR) {
9224
spvGroupOperands.push_back(scalar);
9225
} else if (op == spv::Op::OpGroupBroadcast) {
9226
spv::IdImmediate scope = { true, builder.makeUintConstant(spv::Scope::Subgroup) };
9227
spvGroupOperands.push_back(scope);
9228
spvGroupOperands.push_back(scalar);
9229
spv::IdImmediate operand = { true, operands[1] };
9230
spvGroupOperands.push_back(operand);
9231
} else {
9232
spv::IdImmediate scope = { true, builder.makeUintConstant(spv::Scope::Subgroup) };
9233
spvGroupOperands.push_back(scope);
9234
spv::IdImmediate groupOp = { false, (unsigned)groupOperation };
9235
spvGroupOperands.push_back(groupOp);
9236
spvGroupOperands.push_back(scalar);
9237
}
9238
9239
results.push_back(builder.createOp(op, scalarType, spvGroupOperands));
9240
}
9241
9242
// put the pieces together
9243
return builder.createCompositeConstruct(typeId, results);
9244
}
9245
9246
// Create subgroup invocation operations.
9247
spv::Id TGlslangToSpvTraverser::createSubgroupOperation(glslang::TOperator op, spv::Id typeId,
9248
std::vector<spv::Id>& operands, glslang::TBasicType typeProxy)
9249
{
9250
// Add the required capabilities.
9251
switch (op) {
9252
case glslang::EOpSubgroupElect:
9253
builder.addCapability(spv::Capability::GroupNonUniform);
9254
break;
9255
case glslang::EOpSubgroupQuadAll:
9256
case glslang::EOpSubgroupQuadAny:
9257
builder.addExtension(spv::E_SPV_KHR_quad_control);
9258
builder.addCapability(spv::Capability::QuadControlKHR);
9259
[[fallthrough]];
9260
case glslang::EOpSubgroupAll:
9261
case glslang::EOpSubgroupAny:
9262
case glslang::EOpSubgroupAllEqual:
9263
builder.addCapability(spv::Capability::GroupNonUniform);
9264
builder.addCapability(spv::Capability::GroupNonUniformVote);
9265
break;
9266
case glslang::EOpSubgroupBroadcast:
9267
case glslang::EOpSubgroupBroadcastFirst:
9268
case glslang::EOpSubgroupBallot:
9269
case glslang::EOpSubgroupInverseBallot:
9270
case glslang::EOpSubgroupBallotBitExtract:
9271
case glslang::EOpSubgroupBallotBitCount:
9272
case glslang::EOpSubgroupBallotInclusiveBitCount:
9273
case glslang::EOpSubgroupBallotExclusiveBitCount:
9274
case glslang::EOpSubgroupBallotFindLSB:
9275
case glslang::EOpSubgroupBallotFindMSB:
9276
builder.addCapability(spv::Capability::GroupNonUniform);
9277
builder.addCapability(spv::Capability::GroupNonUniformBallot);
9278
break;
9279
case glslang::EOpSubgroupRotate:
9280
case glslang::EOpSubgroupClusteredRotate:
9281
builder.addExtension(spv::E_SPV_KHR_subgroup_rotate);
9282
builder.addCapability(spv::Capability::GroupNonUniformRotateKHR);
9283
break;
9284
case glslang::EOpSubgroupShuffle:
9285
case glslang::EOpSubgroupShuffleXor:
9286
builder.addCapability(spv::Capability::GroupNonUniform);
9287
builder.addCapability(spv::Capability::GroupNonUniformShuffle);
9288
break;
9289
case glslang::EOpSubgroupShuffleUp:
9290
case glslang::EOpSubgroupShuffleDown:
9291
builder.addCapability(spv::Capability::GroupNonUniform);
9292
builder.addCapability(spv::Capability::GroupNonUniformShuffleRelative);
9293
break;
9294
case glslang::EOpSubgroupAdd:
9295
case glslang::EOpSubgroupMul:
9296
case glslang::EOpSubgroupMin:
9297
case glslang::EOpSubgroupMax:
9298
case glslang::EOpSubgroupAnd:
9299
case glslang::EOpSubgroupOr:
9300
case glslang::EOpSubgroupXor:
9301
case glslang::EOpSubgroupInclusiveAdd:
9302
case glslang::EOpSubgroupInclusiveMul:
9303
case glslang::EOpSubgroupInclusiveMin:
9304
case glslang::EOpSubgroupInclusiveMax:
9305
case glslang::EOpSubgroupInclusiveAnd:
9306
case glslang::EOpSubgroupInclusiveOr:
9307
case glslang::EOpSubgroupInclusiveXor:
9308
case glslang::EOpSubgroupExclusiveAdd:
9309
case glslang::EOpSubgroupExclusiveMul:
9310
case glslang::EOpSubgroupExclusiveMin:
9311
case glslang::EOpSubgroupExclusiveMax:
9312
case glslang::EOpSubgroupExclusiveAnd:
9313
case glslang::EOpSubgroupExclusiveOr:
9314
case glslang::EOpSubgroupExclusiveXor:
9315
builder.addCapability(spv::Capability::GroupNonUniform);
9316
builder.addCapability(spv::Capability::GroupNonUniformArithmetic);
9317
break;
9318
case glslang::EOpSubgroupClusteredAdd:
9319
case glslang::EOpSubgroupClusteredMul:
9320
case glslang::EOpSubgroupClusteredMin:
9321
case glslang::EOpSubgroupClusteredMax:
9322
case glslang::EOpSubgroupClusteredAnd:
9323
case glslang::EOpSubgroupClusteredOr:
9324
case glslang::EOpSubgroupClusteredXor:
9325
builder.addCapability(spv::Capability::GroupNonUniform);
9326
builder.addCapability(spv::Capability::GroupNonUniformClustered);
9327
break;
9328
case glslang::EOpSubgroupQuadBroadcast:
9329
case glslang::EOpSubgroupQuadSwapHorizontal:
9330
case glslang::EOpSubgroupQuadSwapVertical:
9331
case glslang::EOpSubgroupQuadSwapDiagonal:
9332
builder.addCapability(spv::Capability::GroupNonUniform);
9333
builder.addCapability(spv::Capability::GroupNonUniformQuad);
9334
break;
9335
case glslang::EOpSubgroupPartitionedAdd:
9336
case glslang::EOpSubgroupPartitionedMul:
9337
case glslang::EOpSubgroupPartitionedMin:
9338
case glslang::EOpSubgroupPartitionedMax:
9339
case glslang::EOpSubgroupPartitionedAnd:
9340
case glslang::EOpSubgroupPartitionedOr:
9341
case glslang::EOpSubgroupPartitionedXor:
9342
case glslang::EOpSubgroupPartitionedInclusiveAdd:
9343
case glslang::EOpSubgroupPartitionedInclusiveMul:
9344
case glslang::EOpSubgroupPartitionedInclusiveMin:
9345
case glslang::EOpSubgroupPartitionedInclusiveMax:
9346
case glslang::EOpSubgroupPartitionedInclusiveAnd:
9347
case glslang::EOpSubgroupPartitionedInclusiveOr:
9348
case glslang::EOpSubgroupPartitionedInclusiveXor:
9349
case glslang::EOpSubgroupPartitionedExclusiveAdd:
9350
case glslang::EOpSubgroupPartitionedExclusiveMul:
9351
case glslang::EOpSubgroupPartitionedExclusiveMin:
9352
case glslang::EOpSubgroupPartitionedExclusiveMax:
9353
case glslang::EOpSubgroupPartitionedExclusiveAnd:
9354
case glslang::EOpSubgroupPartitionedExclusiveOr:
9355
case glslang::EOpSubgroupPartitionedExclusiveXor:
9356
builder.addExtension(spv::E_SPV_NV_shader_subgroup_partitioned);
9357
builder.addCapability(spv::Capability::GroupNonUniformPartitionedNV);
9358
break;
9359
default: assert(0 && "Unhandled subgroup operation!");
9360
}
9361
9362
9363
const bool isUnsigned = isTypeUnsignedInt(typeProxy);
9364
const bool isFloat = isTypeFloat(typeProxy);
9365
const bool isBool = typeProxy == glslang::EbtBool;
9366
9367
spv::Op opCode = spv::Op::OpNop;
9368
9369
// Figure out which opcode to use.
9370
switch (op) {
9371
case glslang::EOpSubgroupElect: opCode = spv::Op::OpGroupNonUniformElect; break;
9372
case glslang::EOpSubgroupQuadAll: opCode = spv::Op::OpGroupNonUniformQuadAllKHR; break;
9373
case glslang::EOpSubgroupAll: opCode = spv::Op::OpGroupNonUniformAll; break;
9374
case glslang::EOpSubgroupQuadAny: opCode = spv::Op::OpGroupNonUniformQuadAnyKHR; break;
9375
case glslang::EOpSubgroupAny: opCode = spv::Op::OpGroupNonUniformAny; break;
9376
case glslang::EOpSubgroupAllEqual: opCode = spv::Op::OpGroupNonUniformAllEqual; break;
9377
case glslang::EOpSubgroupBroadcast: opCode = spv::Op::OpGroupNonUniformBroadcast; break;
9378
case glslang::EOpSubgroupBroadcastFirst: opCode = spv::Op::OpGroupNonUniformBroadcastFirst; break;
9379
case glslang::EOpSubgroupBallot: opCode = spv::Op::OpGroupNonUniformBallot; break;
9380
case glslang::EOpSubgroupInverseBallot: opCode = spv::Op::OpGroupNonUniformInverseBallot; break;
9381
case glslang::EOpSubgroupBallotBitExtract: opCode = spv::Op::OpGroupNonUniformBallotBitExtract; break;
9382
case glslang::EOpSubgroupBallotBitCount:
9383
case glslang::EOpSubgroupBallotInclusiveBitCount:
9384
case glslang::EOpSubgroupBallotExclusiveBitCount: opCode = spv::Op::OpGroupNonUniformBallotBitCount; break;
9385
case glslang::EOpSubgroupBallotFindLSB: opCode = spv::Op::OpGroupNonUniformBallotFindLSB; break;
9386
case glslang::EOpSubgroupBallotFindMSB: opCode = spv::Op::OpGroupNonUniformBallotFindMSB; break;
9387
case glslang::EOpSubgroupShuffle: opCode = spv::Op::OpGroupNonUniformShuffle; break;
9388
case glslang::EOpSubgroupShuffleXor: opCode = spv::Op::OpGroupNonUniformShuffleXor; break;
9389
case glslang::EOpSubgroupShuffleUp: opCode = spv::Op::OpGroupNonUniformShuffleUp; break;
9390
case glslang::EOpSubgroupShuffleDown: opCode = spv::Op::OpGroupNonUniformShuffleDown; break;
9391
case glslang::EOpSubgroupRotate:
9392
case glslang::EOpSubgroupClusteredRotate: opCode = spv::Op::OpGroupNonUniformRotateKHR; break;
9393
case glslang::EOpSubgroupAdd:
9394
case glslang::EOpSubgroupInclusiveAdd:
9395
case glslang::EOpSubgroupExclusiveAdd:
9396
case glslang::EOpSubgroupClusteredAdd:
9397
case glslang::EOpSubgroupPartitionedAdd:
9398
case glslang::EOpSubgroupPartitionedInclusiveAdd:
9399
case glslang::EOpSubgroupPartitionedExclusiveAdd:
9400
if (isFloat) {
9401
opCode = spv::Op::OpGroupNonUniformFAdd;
9402
} else {
9403
opCode = spv::Op::OpGroupNonUniformIAdd;
9404
}
9405
break;
9406
case glslang::EOpSubgroupMul:
9407
case glslang::EOpSubgroupInclusiveMul:
9408
case glslang::EOpSubgroupExclusiveMul:
9409
case glslang::EOpSubgroupClusteredMul:
9410
case glslang::EOpSubgroupPartitionedMul:
9411
case glslang::EOpSubgroupPartitionedInclusiveMul:
9412
case glslang::EOpSubgroupPartitionedExclusiveMul:
9413
if (isFloat) {
9414
opCode = spv::Op::OpGroupNonUniformFMul;
9415
} else {
9416
opCode = spv::Op::OpGroupNonUniformIMul;
9417
}
9418
break;
9419
case glslang::EOpSubgroupMin:
9420
case glslang::EOpSubgroupInclusiveMin:
9421
case glslang::EOpSubgroupExclusiveMin:
9422
case glslang::EOpSubgroupClusteredMin:
9423
case glslang::EOpSubgroupPartitionedMin:
9424
case glslang::EOpSubgroupPartitionedInclusiveMin:
9425
case glslang::EOpSubgroupPartitionedExclusiveMin:
9426
if (isFloat) {
9427
opCode = spv::Op::OpGroupNonUniformFMin;
9428
} else if (isUnsigned) {
9429
opCode = spv::Op::OpGroupNonUniformUMin;
9430
} else {
9431
opCode = spv::Op::OpGroupNonUniformSMin;
9432
}
9433
break;
9434
case glslang::EOpSubgroupMax:
9435
case glslang::EOpSubgroupInclusiveMax:
9436
case glslang::EOpSubgroupExclusiveMax:
9437
case glslang::EOpSubgroupClusteredMax:
9438
case glslang::EOpSubgroupPartitionedMax:
9439
case glslang::EOpSubgroupPartitionedInclusiveMax:
9440
case glslang::EOpSubgroupPartitionedExclusiveMax:
9441
if (isFloat) {
9442
opCode = spv::Op::OpGroupNonUniformFMax;
9443
} else if (isUnsigned) {
9444
opCode = spv::Op::OpGroupNonUniformUMax;
9445
} else {
9446
opCode = spv::Op::OpGroupNonUniformSMax;
9447
}
9448
break;
9449
case glslang::EOpSubgroupAnd:
9450
case glslang::EOpSubgroupInclusiveAnd:
9451
case glslang::EOpSubgroupExclusiveAnd:
9452
case glslang::EOpSubgroupClusteredAnd:
9453
case glslang::EOpSubgroupPartitionedAnd:
9454
case glslang::EOpSubgroupPartitionedInclusiveAnd:
9455
case glslang::EOpSubgroupPartitionedExclusiveAnd:
9456
if (isBool) {
9457
opCode = spv::Op::OpGroupNonUniformLogicalAnd;
9458
} else {
9459
opCode = spv::Op::OpGroupNonUniformBitwiseAnd;
9460
}
9461
break;
9462
case glslang::EOpSubgroupOr:
9463
case glslang::EOpSubgroupInclusiveOr:
9464
case glslang::EOpSubgroupExclusiveOr:
9465
case glslang::EOpSubgroupClusteredOr:
9466
case glslang::EOpSubgroupPartitionedOr:
9467
case glslang::EOpSubgroupPartitionedInclusiveOr:
9468
case glslang::EOpSubgroupPartitionedExclusiveOr:
9469
if (isBool) {
9470
opCode = spv::Op::OpGroupNonUniformLogicalOr;
9471
} else {
9472
opCode = spv::Op::OpGroupNonUniformBitwiseOr;
9473
}
9474
break;
9475
case glslang::EOpSubgroupXor:
9476
case glslang::EOpSubgroupInclusiveXor:
9477
case glslang::EOpSubgroupExclusiveXor:
9478
case glslang::EOpSubgroupClusteredXor:
9479
case glslang::EOpSubgroupPartitionedXor:
9480
case glslang::EOpSubgroupPartitionedInclusiveXor:
9481
case glslang::EOpSubgroupPartitionedExclusiveXor:
9482
if (isBool) {
9483
opCode = spv::Op::OpGroupNonUniformLogicalXor;
9484
} else {
9485
opCode = spv::Op::OpGroupNonUniformBitwiseXor;
9486
}
9487
break;
9488
case glslang::EOpSubgroupQuadBroadcast: opCode = spv::Op::OpGroupNonUniformQuadBroadcast; break;
9489
case glslang::EOpSubgroupQuadSwapHorizontal:
9490
case glslang::EOpSubgroupQuadSwapVertical:
9491
case glslang::EOpSubgroupQuadSwapDiagonal: opCode = spv::Op::OpGroupNonUniformQuadSwap; break;
9492
default: assert(0 && "Unhandled subgroup operation!");
9493
}
9494
9495
// get the right Group Operation
9496
spv::GroupOperation groupOperation = spv::GroupOperation::Max;
9497
switch (op) {
9498
default:
9499
break;
9500
case glslang::EOpSubgroupBallotBitCount:
9501
case glslang::EOpSubgroupAdd:
9502
case glslang::EOpSubgroupMul:
9503
case glslang::EOpSubgroupMin:
9504
case glslang::EOpSubgroupMax:
9505
case glslang::EOpSubgroupAnd:
9506
case glslang::EOpSubgroupOr:
9507
case glslang::EOpSubgroupXor:
9508
groupOperation = spv::GroupOperation::Reduce;
9509
break;
9510
case glslang::EOpSubgroupBallotInclusiveBitCount:
9511
case glslang::EOpSubgroupInclusiveAdd:
9512
case glslang::EOpSubgroupInclusiveMul:
9513
case glslang::EOpSubgroupInclusiveMin:
9514
case glslang::EOpSubgroupInclusiveMax:
9515
case glslang::EOpSubgroupInclusiveAnd:
9516
case glslang::EOpSubgroupInclusiveOr:
9517
case glslang::EOpSubgroupInclusiveXor:
9518
groupOperation = spv::GroupOperation::InclusiveScan;
9519
break;
9520
case glslang::EOpSubgroupBallotExclusiveBitCount:
9521
case glslang::EOpSubgroupExclusiveAdd:
9522
case glslang::EOpSubgroupExclusiveMul:
9523
case glslang::EOpSubgroupExclusiveMin:
9524
case glslang::EOpSubgroupExclusiveMax:
9525
case glslang::EOpSubgroupExclusiveAnd:
9526
case glslang::EOpSubgroupExclusiveOr:
9527
case glslang::EOpSubgroupExclusiveXor:
9528
groupOperation = spv::GroupOperation::ExclusiveScan;
9529
break;
9530
case glslang::EOpSubgroupClusteredAdd:
9531
case glslang::EOpSubgroupClusteredMul:
9532
case glslang::EOpSubgroupClusteredMin:
9533
case glslang::EOpSubgroupClusteredMax:
9534
case glslang::EOpSubgroupClusteredAnd:
9535
case glslang::EOpSubgroupClusteredOr:
9536
case glslang::EOpSubgroupClusteredXor:
9537
groupOperation = spv::GroupOperation::ClusteredReduce;
9538
break;
9539
case glslang::EOpSubgroupPartitionedAdd:
9540
case glslang::EOpSubgroupPartitionedMul:
9541
case glslang::EOpSubgroupPartitionedMin:
9542
case glslang::EOpSubgroupPartitionedMax:
9543
case glslang::EOpSubgroupPartitionedAnd:
9544
case glslang::EOpSubgroupPartitionedOr:
9545
case glslang::EOpSubgroupPartitionedXor:
9546
groupOperation = spv::GroupOperation::PartitionedReduceNV;
9547
break;
9548
case glslang::EOpSubgroupPartitionedInclusiveAdd:
9549
case glslang::EOpSubgroupPartitionedInclusiveMul:
9550
case glslang::EOpSubgroupPartitionedInclusiveMin:
9551
case glslang::EOpSubgroupPartitionedInclusiveMax:
9552
case glslang::EOpSubgroupPartitionedInclusiveAnd:
9553
case glslang::EOpSubgroupPartitionedInclusiveOr:
9554
case glslang::EOpSubgroupPartitionedInclusiveXor:
9555
groupOperation = spv::GroupOperation::PartitionedInclusiveScanNV;
9556
break;
9557
case glslang::EOpSubgroupPartitionedExclusiveAdd:
9558
case glslang::EOpSubgroupPartitionedExclusiveMul:
9559
case glslang::EOpSubgroupPartitionedExclusiveMin:
9560
case glslang::EOpSubgroupPartitionedExclusiveMax:
9561
case glslang::EOpSubgroupPartitionedExclusiveAnd:
9562
case glslang::EOpSubgroupPartitionedExclusiveOr:
9563
case glslang::EOpSubgroupPartitionedExclusiveXor:
9564
groupOperation = spv::GroupOperation::PartitionedExclusiveScanNV;
9565
break;
9566
}
9567
9568
// build the instruction
9569
std::vector<spv::IdImmediate> spvGroupOperands;
9570
9571
// Every operation begins with the Execution Scope operand.
9572
spv::IdImmediate executionScope = { true, builder.makeUintConstant(spv::Scope::Subgroup) };
9573
// All other ops need the execution scope. Quad Control Ops don't need scope, it's always Quad.
9574
if (opCode != spv::Op::OpGroupNonUniformQuadAllKHR && opCode != spv::Op::OpGroupNonUniformQuadAnyKHR) {
9575
spvGroupOperands.push_back(executionScope);
9576
}
9577
9578
// Next, for all operations that use a Group Operation, push that as an operand.
9579
if (groupOperation != spv::GroupOperation::Max) {
9580
spv::IdImmediate groupOperand = { false, (unsigned)groupOperation };
9581
spvGroupOperands.push_back(groupOperand);
9582
}
9583
9584
// Push back the operands next.
9585
for (auto opIt = operands.cbegin(); opIt != operands.cend(); ++opIt) {
9586
spv::IdImmediate operand = { true, *opIt };
9587
spvGroupOperands.push_back(operand);
9588
}
9589
9590
// Some opcodes have additional operands.
9591
spv::Id directionId = spv::NoResult;
9592
switch (op) {
9593
default: break;
9594
case glslang::EOpSubgroupQuadSwapHorizontal: directionId = builder.makeUintConstant(0); break;
9595
case glslang::EOpSubgroupQuadSwapVertical: directionId = builder.makeUintConstant(1); break;
9596
case glslang::EOpSubgroupQuadSwapDiagonal: directionId = builder.makeUintConstant(2); break;
9597
}
9598
if (directionId != spv::NoResult) {
9599
spv::IdImmediate direction = { true, directionId };
9600
spvGroupOperands.push_back(direction);
9601
}
9602
9603
return builder.createOp(opCode, typeId, spvGroupOperands);
9604
}
9605
9606
spv::Id TGlslangToSpvTraverser::createMiscOperation(glslang::TOperator op, spv::Decoration precision,
9607
spv::Id typeId, std::vector<spv::Id>& operands, glslang::TBasicType typeProxy)
9608
{
9609
bool isUnsigned = isTypeUnsignedInt(typeProxy);
9610
bool isFloat = isTypeFloat(typeProxy);
9611
9612
spv::Op opCode = spv::Op::OpNop;
9613
int extBuiltins = -1;
9614
int libCall = -1;
9615
size_t consumedOperands = operands.size();
9616
spv::Id typeId0 = 0;
9617
if (consumedOperands > 0)
9618
typeId0 = builder.getTypeId(operands[0]);
9619
spv::Id typeId1 = 0;
9620
if (consumedOperands > 1)
9621
typeId1 = builder.getTypeId(operands[1]);
9622
spv::Id frexpIntType = 0;
9623
9624
switch (op) {
9625
case glslang::EOpMin:
9626
if (isFloat)
9627
libCall = nanMinMaxClamp ? spv::GLSLstd450NMin : spv::GLSLstd450FMin;
9628
else if (isUnsigned)
9629
libCall = spv::GLSLstd450UMin;
9630
else
9631
libCall = spv::GLSLstd450SMin;
9632
builder.promoteScalar(precision, operands.front(), operands.back());
9633
break;
9634
case glslang::EOpModf:
9635
{
9636
libCall = spv::GLSLstd450ModfStruct;
9637
assert(builder.isFloatType(builder.getScalarTypeId(typeId0)));
9638
// The returned struct has two members of the same type as the first argument
9639
typeId = builder.makeStructResultType(typeId0, typeId0);
9640
consumedOperands = 1;
9641
}
9642
break;
9643
case glslang::EOpMax:
9644
if (isFloat)
9645
libCall = nanMinMaxClamp ? spv::GLSLstd450NMax : spv::GLSLstd450FMax;
9646
else if (isUnsigned)
9647
libCall = spv::GLSLstd450UMax;
9648
else
9649
libCall = spv::GLSLstd450SMax;
9650
builder.promoteScalar(precision, operands.front(), operands.back());
9651
break;
9652
case glslang::EOpPow:
9653
libCall = spv::GLSLstd450Pow;
9654
break;
9655
case glslang::EOpDot:
9656
case glslang::EOpDotPackedEXT:
9657
case glslang::EOpDotAccSatEXT:
9658
case glslang::EOpDotPackedAccSatEXT:
9659
{
9660
if (builder.isFloatType(builder.getScalarTypeId(typeId0)) ||
9661
// HLSL supports dot(int,int) which is just a multiply
9662
glslangIntermediate->getSource() == glslang::EShSourceHlsl) {
9663
if (typeProxy == glslang::EbtBFloat16) {
9664
builder.addExtension(spv::E_SPV_KHR_bfloat16);
9665
builder.addCapability(spv::Capability::BFloat16DotProductKHR);
9666
}
9667
opCode = spv::Op::OpDot;
9668
} else {
9669
builder.addExtension(spv::E_SPV_KHR_integer_dot_product);
9670
builder.addCapability(spv::Capability::DotProductKHR);
9671
const unsigned int vectorSize = builder.getNumComponents(operands[0]);
9672
if (op == glslang::EOpDotPackedEXT || op == glslang::EOpDotPackedAccSatEXT) {
9673
builder.addCapability(spv::Capability::DotProductInput4x8BitPackedKHR);
9674
} else if (vectorSize == 4 && builder.getScalarTypeWidth(typeId0) == 8) {
9675
builder.addCapability(spv::Capability::DotProductInput4x8BitKHR);
9676
} else {
9677
builder.addCapability(spv::Capability::DotProductInputAllKHR);
9678
}
9679
const bool type0isSigned = builder.isIntType(builder.getScalarTypeId(typeId0));
9680
const bool type1isSigned = builder.isIntType(builder.getScalarTypeId(typeId1));
9681
const bool accSat = (op == glslang::EOpDotAccSatEXT || op == glslang::EOpDotPackedAccSatEXT);
9682
if (!type0isSigned && !type1isSigned) {
9683
opCode = accSat ? spv::Op::OpUDotAccSatKHR : spv::Op::OpUDotKHR;
9684
} else if (type0isSigned && type1isSigned) {
9685
opCode = accSat ? spv::Op::OpSDotAccSatKHR : spv::Op::OpSDotKHR;
9686
} else {
9687
opCode = accSat ? spv::Op::OpSUDotAccSatKHR : spv::Op::OpSUDotKHR;
9688
// the spir-v opcode assumes the operands to be "signed, unsigned" in that order, so swap if needed
9689
if (type1isSigned) {
9690
std::swap(operands[0], operands[1]);
9691
}
9692
}
9693
std::vector<spv::IdImmediate> operands2;
9694
for (auto &o : operands) {
9695
operands2.push_back({true, o});
9696
}
9697
if (op == glslang::EOpDotPackedEXT || op == glslang::EOpDotPackedAccSatEXT) {
9698
operands2.push_back({false, 0});
9699
}
9700
return builder.createOp(opCode, typeId, operands2);
9701
}
9702
}
9703
break;
9704
case glslang::EOpAtan:
9705
libCall = spv::GLSLstd450Atan2;
9706
break;
9707
9708
case glslang::EOpClamp:
9709
if (isFloat)
9710
libCall = nanMinMaxClamp ? spv::GLSLstd450NClamp : spv::GLSLstd450FClamp;
9711
else if (isUnsigned)
9712
libCall = spv::GLSLstd450UClamp;
9713
else
9714
libCall = spv::GLSLstd450SClamp;
9715
builder.promoteScalar(precision, operands.front(), operands[1]);
9716
builder.promoteScalar(precision, operands.front(), operands[2]);
9717
break;
9718
case glslang::EOpMix:
9719
if (! builder.isBoolType(builder.getScalarTypeId(builder.getTypeId(operands.back())))) {
9720
assert(isFloat);
9721
libCall = spv::GLSLstd450FMix;
9722
} else {
9723
opCode = spv::Op::OpSelect;
9724
std::swap(operands.front(), operands.back());
9725
}
9726
builder.promoteScalar(precision, operands.front(), operands.back());
9727
break;
9728
case glslang::EOpStep:
9729
libCall = spv::GLSLstd450Step;
9730
builder.promoteScalar(precision, operands.front(), operands.back());
9731
break;
9732
case glslang::EOpSmoothStep:
9733
libCall = spv::GLSLstd450SmoothStep;
9734
builder.promoteScalar(precision, operands[0], operands[2]);
9735
builder.promoteScalar(precision, operands[1], operands[2]);
9736
break;
9737
9738
case glslang::EOpDistance:
9739
libCall = spv::GLSLstd450Distance;
9740
break;
9741
case glslang::EOpCross:
9742
libCall = spv::GLSLstd450Cross;
9743
break;
9744
case glslang::EOpFaceForward:
9745
libCall = spv::GLSLstd450FaceForward;
9746
break;
9747
case glslang::EOpReflect:
9748
libCall = spv::GLSLstd450Reflect;
9749
break;
9750
case glslang::EOpRefract:
9751
libCall = spv::GLSLstd450Refract;
9752
break;
9753
case glslang::EOpBarrier:
9754
{
9755
// This is for the extended controlBarrier function, with four operands.
9756
// The unextended barrier() goes through createNoArgOperation.
9757
assert(operands.size() == 4);
9758
auto const executionScope = (spv::Scope)builder.getConstantScalar(operands[0]);
9759
auto const memoryScope = (spv::Scope)builder.getConstantScalar(operands[1]);
9760
auto const semantics = (spv::MemorySemanticsMask)(builder.getConstantScalar(operands[2]) | builder.getConstantScalar(operands[3]));
9761
builder.createControlBarrier(executionScope, memoryScope,
9762
semantics);
9763
if (anySet(semantics, spv::MemorySemanticsMask::MakeAvailableKHR |
9764
spv::MemorySemanticsMask::MakeVisibleKHR |
9765
spv::MemorySemanticsMask::OutputMemoryKHR |
9766
spv::MemorySemanticsMask::Volatile)) {
9767
builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
9768
}
9769
if (glslangIntermediate->usingVulkanMemoryModel() && (executionScope == spv::Scope::Device ||
9770
memoryScope == spv::Scope::Device)) {
9771
builder.addCapability(spv::Capability::VulkanMemoryModelDeviceScopeKHR);
9772
}
9773
return 0;
9774
}
9775
break;
9776
case glslang::EOpMemoryBarrier:
9777
{
9778
// This is for the extended memoryBarrier function, with three operands.
9779
// The unextended memoryBarrier() goes through createNoArgOperation.
9780
assert(operands.size() == 3);
9781
auto const memoryScope = (spv::Scope)builder.getConstantScalar(operands[0]);
9782
auto const semantics = (spv::MemorySemanticsMask)(builder.getConstantScalar(operands[1]) | builder.getConstantScalar(operands[2]));
9783
builder.createMemoryBarrier(memoryScope, semantics);
9784
if (anySet(semantics, spv::MemorySemanticsMask::MakeAvailableKHR |
9785
spv::MemorySemanticsMask::MakeVisibleKHR |
9786
spv::MemorySemanticsMask::OutputMemoryKHR |
9787
spv::MemorySemanticsMask::Volatile)) {
9788
builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
9789
}
9790
if (glslangIntermediate->usingVulkanMemoryModel() && memoryScope == spv::Scope::Device) {
9791
builder.addCapability(spv::Capability::VulkanMemoryModelDeviceScopeKHR);
9792
}
9793
return 0;
9794
}
9795
break;
9796
9797
case glslang::EOpInterpolateAtSample:
9798
if (typeProxy == glslang::EbtFloat16)
9799
builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float);
9800
libCall = spv::GLSLstd450InterpolateAtSample;
9801
break;
9802
case glslang::EOpInterpolateAtOffset:
9803
if (typeProxy == glslang::EbtFloat16)
9804
builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float);
9805
libCall = spv::GLSLstd450InterpolateAtOffset;
9806
break;
9807
case glslang::EOpAddCarry:
9808
opCode = spv::Op::OpIAddCarry;
9809
typeId = builder.makeStructResultType(typeId0, typeId0);
9810
consumedOperands = 2;
9811
break;
9812
case glslang::EOpSubBorrow:
9813
opCode = spv::Op::OpISubBorrow;
9814
typeId = builder.makeStructResultType(typeId0, typeId0);
9815
consumedOperands = 2;
9816
break;
9817
case glslang::EOpUMulExtended:
9818
opCode = spv::Op::OpUMulExtended;
9819
typeId = builder.makeStructResultType(typeId0, typeId0);
9820
consumedOperands = 2;
9821
break;
9822
case glslang::EOpIMulExtended:
9823
opCode = spv::Op::OpSMulExtended;
9824
typeId = builder.makeStructResultType(typeId0, typeId0);
9825
consumedOperands = 2;
9826
break;
9827
case glslang::EOpBitfieldExtract:
9828
if (isUnsigned)
9829
opCode = spv::Op::OpBitFieldUExtract;
9830
else
9831
opCode = spv::Op::OpBitFieldSExtract;
9832
break;
9833
case glslang::EOpBitfieldInsert:
9834
opCode = spv::Op::OpBitFieldInsert;
9835
break;
9836
9837
case glslang::EOpFma:
9838
libCall = spv::GLSLstd450Fma;
9839
break;
9840
case glslang::EOpFrexp:
9841
{
9842
libCall = spv::GLSLstd450FrexpStruct;
9843
assert(builder.isPointerType(typeId1));
9844
typeId1 = builder.getContainedTypeId(typeId1);
9845
int width = builder.getScalarTypeWidth(typeId1);
9846
if (width == 16)
9847
// Using 16-bit exp operand, enable extension SPV_AMD_gpu_shader_int16
9848
builder.addExtension(spv::E_SPV_AMD_gpu_shader_int16);
9849
if (builder.getNumComponents(operands[0]) == 1)
9850
frexpIntType = builder.makeIntegerType(width, true);
9851
else
9852
frexpIntType = builder.makeVectorType(builder.makeIntegerType(width, true),
9853
builder.getNumComponents(operands[0]));
9854
typeId = builder.makeStructResultType(typeId0, frexpIntType);
9855
consumedOperands = 1;
9856
}
9857
break;
9858
case glslang::EOpLdexp:
9859
libCall = spv::GLSLstd450Ldexp;
9860
break;
9861
9862
case glslang::EOpReadInvocation:
9863
return createInvocationsOperation(op, typeId, operands, typeProxy);
9864
9865
case glslang::EOpSubgroupBroadcast:
9866
case glslang::EOpSubgroupBallotBitExtract:
9867
case glslang::EOpSubgroupShuffle:
9868
case glslang::EOpSubgroupShuffleXor:
9869
case glslang::EOpSubgroupShuffleUp:
9870
case glslang::EOpSubgroupShuffleDown:
9871
case glslang::EOpSubgroupRotate:
9872
case glslang::EOpSubgroupClusteredRotate:
9873
case glslang::EOpSubgroupClusteredAdd:
9874
case glslang::EOpSubgroupClusteredMul:
9875
case glslang::EOpSubgroupClusteredMin:
9876
case glslang::EOpSubgroupClusteredMax:
9877
case glslang::EOpSubgroupClusteredAnd:
9878
case glslang::EOpSubgroupClusteredOr:
9879
case glslang::EOpSubgroupClusteredXor:
9880
case glslang::EOpSubgroupQuadBroadcast:
9881
case glslang::EOpSubgroupPartitionedAdd:
9882
case glslang::EOpSubgroupPartitionedMul:
9883
case glslang::EOpSubgroupPartitionedMin:
9884
case glslang::EOpSubgroupPartitionedMax:
9885
case glslang::EOpSubgroupPartitionedAnd:
9886
case glslang::EOpSubgroupPartitionedOr:
9887
case glslang::EOpSubgroupPartitionedXor:
9888
case glslang::EOpSubgroupPartitionedInclusiveAdd:
9889
case glslang::EOpSubgroupPartitionedInclusiveMul:
9890
case glslang::EOpSubgroupPartitionedInclusiveMin:
9891
case glslang::EOpSubgroupPartitionedInclusiveMax:
9892
case glslang::EOpSubgroupPartitionedInclusiveAnd:
9893
case glslang::EOpSubgroupPartitionedInclusiveOr:
9894
case glslang::EOpSubgroupPartitionedInclusiveXor:
9895
case glslang::EOpSubgroupPartitionedExclusiveAdd:
9896
case glslang::EOpSubgroupPartitionedExclusiveMul:
9897
case glslang::EOpSubgroupPartitionedExclusiveMin:
9898
case glslang::EOpSubgroupPartitionedExclusiveMax:
9899
case glslang::EOpSubgroupPartitionedExclusiveAnd:
9900
case glslang::EOpSubgroupPartitionedExclusiveOr:
9901
case glslang::EOpSubgroupPartitionedExclusiveXor:
9902
return createSubgroupOperation(op, typeId, operands, typeProxy);
9903
9904
case glslang::EOpSwizzleInvocations:
9905
extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_ballot);
9906
libCall = spv::SwizzleInvocationsAMD;
9907
break;
9908
case glslang::EOpSwizzleInvocationsMasked:
9909
extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_ballot);
9910
libCall = spv::SwizzleInvocationsMaskedAMD;
9911
break;
9912
case glslang::EOpWriteInvocation:
9913
extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_ballot);
9914
libCall = spv::WriteInvocationAMD;
9915
break;
9916
9917
case glslang::EOpMin3:
9918
extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_trinary_minmax);
9919
if (isFloat)
9920
libCall = spv::FMin3AMD;
9921
else {
9922
if (isUnsigned)
9923
libCall = spv::UMin3AMD;
9924
else
9925
libCall = spv::SMin3AMD;
9926
}
9927
break;
9928
case glslang::EOpMax3:
9929
extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_trinary_minmax);
9930
if (isFloat)
9931
libCall = spv::FMax3AMD;
9932
else {
9933
if (isUnsigned)
9934
libCall = spv::UMax3AMD;
9935
else
9936
libCall = spv::SMax3AMD;
9937
}
9938
break;
9939
case glslang::EOpMid3:
9940
extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_trinary_minmax);
9941
if (isFloat)
9942
libCall = spv::FMid3AMD;
9943
else {
9944
if (isUnsigned)
9945
libCall = spv::UMid3AMD;
9946
else
9947
libCall = spv::SMid3AMD;
9948
}
9949
break;
9950
9951
case glslang::EOpInterpolateAtVertex:
9952
if (typeProxy == glslang::EbtFloat16)
9953
builder.addExtension(spv::E_SPV_AMD_gpu_shader_half_float);
9954
extBuiltins = getExtBuiltins(spv::E_SPV_AMD_shader_explicit_vertex_parameter);
9955
libCall = spv::InterpolateAtVertexAMD;
9956
break;
9957
9958
case glslang::EOpReportIntersection:
9959
typeId = builder.makeBoolType();
9960
opCode = spv::Op::OpReportIntersectionKHR;
9961
break;
9962
case glslang::EOpTraceNV:
9963
builder.createNoResultOp(spv::Op::OpTraceNV, operands);
9964
return 0;
9965
case glslang::EOpTraceRayMotionNV:
9966
builder.addExtension(spv::E_SPV_NV_ray_tracing_motion_blur);
9967
builder.addCapability(spv::Capability::RayTracingMotionBlurNV);
9968
builder.createNoResultOp(spv::Op::OpTraceRayMotionNV, operands);
9969
return 0;
9970
case glslang::EOpTraceKHR:
9971
builder.createNoResultOp(spv::Op::OpTraceRayKHR, operands);
9972
return 0;
9973
case glslang::EOpExecuteCallableNV:
9974
builder.createNoResultOp(spv::Op::OpExecuteCallableNV, operands);
9975
return 0;
9976
case glslang::EOpExecuteCallableKHR:
9977
builder.createNoResultOp(spv::Op::OpExecuteCallableKHR, operands);
9978
return 0;
9979
9980
case glslang::EOpRayQueryInitialize:
9981
builder.createNoResultOp(spv::Op::OpRayQueryInitializeKHR, operands);
9982
return 0;
9983
case glslang::EOpRayQueryTerminate:
9984
builder.createNoResultOp(spv::Op::OpRayQueryTerminateKHR, operands);
9985
return 0;
9986
case glslang::EOpRayQueryGenerateIntersection:
9987
builder.createNoResultOp(spv::Op::OpRayQueryGenerateIntersectionKHR, operands);
9988
return 0;
9989
case glslang::EOpRayQueryConfirmIntersection:
9990
builder.createNoResultOp(spv::Op::OpRayQueryConfirmIntersectionKHR, operands);
9991
return 0;
9992
case glslang::EOpRayQueryProceed:
9993
typeId = builder.makeBoolType();
9994
opCode = spv::Op::OpRayQueryProceedKHR;
9995
break;
9996
case glslang::EOpRayQueryGetIntersectionType:
9997
typeId = builder.makeUintType(32);
9998
opCode = spv::Op::OpRayQueryGetIntersectionTypeKHR;
9999
break;
10000
case glslang::EOpRayQueryGetRayTMin:
10001
typeId = builder.makeFloatType(32);
10002
opCode = spv::Op::OpRayQueryGetRayTMinKHR;
10003
break;
10004
case glslang::EOpRayQueryGetRayFlags:
10005
typeId = builder.makeIntType(32);
10006
opCode = spv::Op::OpRayQueryGetRayFlagsKHR;
10007
break;
10008
case glslang::EOpRayQueryGetIntersectionT:
10009
typeId = builder.makeFloatType(32);
10010
opCode = spv::Op::OpRayQueryGetIntersectionTKHR;
10011
break;
10012
case glslang::EOpRayQueryGetIntersectionInstanceCustomIndex:
10013
typeId = builder.makeIntType(32);
10014
opCode = spv::Op::OpRayQueryGetIntersectionInstanceCustomIndexKHR;
10015
break;
10016
case glslang::EOpRayQueryGetIntersectionInstanceId:
10017
typeId = builder.makeIntType(32);
10018
opCode = spv::Op::OpRayQueryGetIntersectionInstanceIdKHR;
10019
break;
10020
case glslang::EOpRayQueryGetIntersectionInstanceShaderBindingTableRecordOffset:
10021
typeId = builder.makeUintType(32);
10022
opCode = spv::Op::OpRayQueryGetIntersectionInstanceShaderBindingTableRecordOffsetKHR;
10023
break;
10024
case glslang::EOpRayQueryGetIntersectionGeometryIndex:
10025
typeId = builder.makeIntType(32);
10026
opCode = spv::Op::OpRayQueryGetIntersectionGeometryIndexKHR;
10027
break;
10028
case glslang::EOpRayQueryGetIntersectionPrimitiveIndex:
10029
typeId = builder.makeIntType(32);
10030
opCode = spv::Op::OpRayQueryGetIntersectionPrimitiveIndexKHR;
10031
break;
10032
case glslang::EOpRayQueryGetIntersectionBarycentrics:
10033
typeId = builder.makeVectorType(builder.makeFloatType(32), 2);
10034
opCode = spv::Op::OpRayQueryGetIntersectionBarycentricsKHR;
10035
break;
10036
case glslang::EOpRayQueryGetIntersectionFrontFace:
10037
typeId = builder.makeBoolType();
10038
opCode = spv::Op::OpRayQueryGetIntersectionFrontFaceKHR;
10039
break;
10040
case glslang::EOpRayQueryGetIntersectionCandidateAABBOpaque:
10041
typeId = builder.makeBoolType();
10042
opCode = spv::Op::OpRayQueryGetIntersectionCandidateAABBOpaqueKHR;
10043
break;
10044
case glslang::EOpRayQueryGetIntersectionObjectRayDirection:
10045
typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
10046
opCode = spv::Op::OpRayQueryGetIntersectionObjectRayDirectionKHR;
10047
break;
10048
case glslang::EOpRayQueryGetIntersectionObjectRayOrigin:
10049
typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
10050
opCode = spv::Op::OpRayQueryGetIntersectionObjectRayOriginKHR;
10051
break;
10052
case glslang::EOpRayQueryGetWorldRayDirection:
10053
typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
10054
opCode = spv::Op::OpRayQueryGetWorldRayDirectionKHR;
10055
break;
10056
case glslang::EOpRayQueryGetWorldRayOrigin:
10057
typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
10058
opCode = spv::Op::OpRayQueryGetWorldRayOriginKHR;
10059
break;
10060
case glslang::EOpRayQueryGetIntersectionObjectToWorld:
10061
typeId = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);
10062
opCode = spv::Op::OpRayQueryGetIntersectionObjectToWorldKHR;
10063
break;
10064
case glslang::EOpRayQueryGetIntersectionClusterIdNV:
10065
typeId = builder.makeIntegerType(32, 1);
10066
opCode = spv::Op::OpRayQueryGetClusterIdNV;
10067
break;
10068
case glslang::EOpRayQueryGetIntersectionWorldToObject:
10069
typeId = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);
10070
opCode = spv::Op::OpRayQueryGetIntersectionWorldToObjectKHR;
10071
break;
10072
case glslang::EOpRayQueryGetIntersectionSpherePositionNV:
10073
typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
10074
opCode = spv::Op::OpRayQueryGetIntersectionSpherePositionNV;
10075
break;
10076
case glslang::EOpRayQueryGetIntersectionSphereRadiusNV:
10077
typeId = builder.makeFloatType(32);
10078
opCode = spv::Op::OpRayQueryGetIntersectionSphereRadiusNV;
10079
break;
10080
case glslang::EOpRayQueryGetIntersectionLSSHitValueNV:
10081
typeId = builder.makeFloatType(32);
10082
opCode = spv::Op::OpRayQueryGetIntersectionLSSHitValueNV;
10083
break;
10084
case glslang::EOpRayQueryIsSphereHitNV:
10085
typeId = builder.makeBoolType();
10086
opCode = spv::Op::OpRayQueryIsSphereHitNV;
10087
break;
10088
case glslang::EOpRayQueryIsLSSHitNV:
10089
typeId = builder.makeBoolType();
10090
opCode = spv::Op::OpRayQueryIsLSSHitNV;
10091
break;
10092
case glslang::EOpWritePackedPrimitiveIndices4x8NV:
10093
builder.createNoResultOp(spv::Op::OpWritePackedPrimitiveIndices4x8NV, operands);
10094
return 0;
10095
case glslang::EOpEmitMeshTasksEXT:
10096
if (taskPayloadID)
10097
operands.push_back(taskPayloadID);
10098
// As per SPV_EXT_mesh_shader make it a terminating instruction in the current block
10099
builder.makeStatementTerminator(spv::Op::OpEmitMeshTasksEXT, operands, "post-OpEmitMeshTasksEXT");
10100
return 0;
10101
case glslang::EOpSetMeshOutputsEXT:
10102
builder.createNoResultOp(spv::Op::OpSetMeshOutputsEXT, operands);
10103
return 0;
10104
case glslang::EOpCooperativeMatrixMulAddNV:
10105
opCode = spv::Op::OpCooperativeMatrixMulAddNV;
10106
break;
10107
case glslang::EOpHitObjectTraceRayNV:
10108
builder.createNoResultOp(spv::Op::OpHitObjectTraceRayNV, operands);
10109
return 0;
10110
case glslang::EOpHitObjectTraceRayEXT:
10111
builder.createNoResultOp(spv::Op::OpHitObjectTraceRayEXT, operands);
10112
return 0;
10113
case glslang::EOpHitObjectTraceRayMotionNV:
10114
builder.createNoResultOp(spv::Op::OpHitObjectTraceRayMotionNV, operands);
10115
return 0;
10116
case glslang::EOpHitObjectTraceRayMotionEXT:
10117
builder.createNoResultOp(spv::Op::OpHitObjectTraceRayMotionEXT, operands);
10118
return 0;
10119
case glslang::EOpHitObjectRecordHitNV:
10120
builder.createNoResultOp(spv::Op::OpHitObjectRecordHitNV, operands);
10121
return 0;
10122
case glslang::EOpHitObjectRecordHitMotionNV:
10123
builder.createNoResultOp(spv::Op::OpHitObjectRecordHitMotionNV, operands);
10124
return 0;
10125
case glslang::EOpHitObjectRecordHitWithIndexNV:
10126
builder.createNoResultOp(spv::Op::OpHitObjectRecordHitWithIndexNV, operands);
10127
return 0;
10128
case glslang::EOpHitObjectRecordHitWithIndexMotionNV:
10129
builder.createNoResultOp(spv::Op::OpHitObjectRecordHitWithIndexMotionNV, operands);
10130
return 0;
10131
case glslang::EOpHitObjectRecordMissNV:
10132
builder.createNoResultOp(spv::Op::OpHitObjectRecordMissNV, operands);
10133
return 0;
10134
case glslang::EOpHitObjectRecordMissEXT:
10135
builder.createNoResultOp(spv::Op::OpHitObjectRecordMissEXT, operands);
10136
return 0;
10137
case glslang::EOpHitObjectRecordMissMotionNV:
10138
builder.createNoResultOp(spv::Op::OpHitObjectRecordMissMotionNV, operands);
10139
return 0;
10140
case glslang::EOpHitObjectRecordMissMotionEXT:
10141
builder.createNoResultOp(spv::Op::OpHitObjectRecordMissMotionEXT, operands);
10142
return 0;
10143
case glslang::EOpHitObjectExecuteShaderNV:
10144
builder.createNoResultOp(spv::Op::OpHitObjectExecuteShaderNV, operands);
10145
return 0;
10146
case glslang::EOpHitObjectExecuteShaderEXT:
10147
builder.createNoResultOp(spv::Op::OpHitObjectExecuteShaderEXT, operands);
10148
return 0;
10149
case glslang::EOpHitObjectIsEmptyNV:
10150
typeId = builder.makeBoolType();
10151
opCode = spv::Op::OpHitObjectIsEmptyNV;
10152
break;
10153
case glslang::EOpHitObjectIsEmptyEXT:
10154
typeId = builder.makeBoolType();
10155
opCode = spv::Op::OpHitObjectIsEmptyEXT;
10156
break;
10157
case glslang::EOpHitObjectIsMissNV:
10158
typeId = builder.makeBoolType();
10159
opCode = spv::Op::OpHitObjectIsMissNV;
10160
break;
10161
case glslang::EOpHitObjectIsMissEXT:
10162
typeId = builder.makeBoolType();
10163
opCode = spv::Op::OpHitObjectIsMissEXT;
10164
break;
10165
case glslang::EOpHitObjectIsHitNV:
10166
typeId = builder.makeBoolType();
10167
opCode = spv::Op::OpHitObjectIsHitNV;
10168
break;
10169
case glslang::EOpHitObjectIsSphereHitNV:
10170
typeId = builder.makeBoolType();
10171
opCode = spv::Op::OpHitObjectIsSphereHitNV;
10172
break;
10173
case glslang::EOpHitObjectIsLSSHitNV:
10174
typeId = builder.makeBoolType();
10175
opCode = spv::Op::OpHitObjectIsLSSHitNV;
10176
break;
10177
case glslang::EOpHitObjectIsHitEXT:
10178
typeId = builder.makeBoolType();
10179
opCode = spv::Op::OpHitObjectIsHitEXT;
10180
break;
10181
case glslang::EOpHitObjectGetRayTMinNV:
10182
typeId = builder.makeFloatType(32);
10183
opCode = spv::Op::OpHitObjectGetRayTMinNV;
10184
break;
10185
case glslang::EOpHitObjectGetRayTMinEXT:
10186
typeId = builder.makeFloatType(32);
10187
opCode = spv::Op::OpHitObjectGetRayTMinEXT;
10188
break;
10189
case glslang::EOpHitObjectGetRayTMaxNV:
10190
typeId = builder.makeFloatType(32);
10191
opCode = spv::Op::OpHitObjectGetRayTMaxNV;
10192
break;
10193
case glslang::EOpHitObjectGetRayTMaxEXT:
10194
typeId = builder.makeFloatType(32);
10195
opCode = spv::Op::OpHitObjectGetRayTMaxEXT;
10196
break;
10197
case glslang::EOpHitObjectGetRayFlagsEXT:
10198
typeId = builder.makeIntegerType(32, 0);
10199
opCode = spv::Op::OpHitObjectGetRayFlagsEXT;
10200
break;
10201
case glslang::EOpHitObjectGetObjectRayOriginNV:
10202
typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
10203
opCode = spv::Op::OpHitObjectGetObjectRayOriginNV;
10204
break;
10205
case glslang::EOpHitObjectGetObjectRayOriginEXT:
10206
typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
10207
opCode = spv::Op::OpHitObjectGetObjectRayOriginEXT;
10208
break;
10209
case glslang::EOpHitObjectGetObjectRayDirectionNV:
10210
typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
10211
opCode = spv::Op::OpHitObjectGetObjectRayDirectionNV;
10212
break;
10213
case glslang::EOpHitObjectGetObjectRayDirectionEXT:
10214
typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
10215
opCode = spv::Op::OpHitObjectGetObjectRayDirectionEXT;
10216
break;
10217
case glslang::EOpHitObjectGetWorldRayOriginNV:
10218
typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
10219
opCode = spv::Op::OpHitObjectGetWorldRayOriginNV;
10220
break;
10221
case glslang::EOpHitObjectGetWorldRayOriginEXT:
10222
typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
10223
opCode = spv::Op::OpHitObjectGetWorldRayOriginEXT;
10224
break;
10225
case glslang::EOpHitObjectGetWorldRayDirectionNV:
10226
typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
10227
opCode = spv::Op::OpHitObjectGetWorldRayDirectionNV;
10228
break;
10229
case glslang::EOpHitObjectGetWorldRayDirectionEXT:
10230
typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
10231
opCode = spv::Op::OpHitObjectGetWorldRayDirectionEXT;
10232
break;
10233
case glslang::EOpHitObjectGetWorldToObjectNV:
10234
typeId = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);
10235
opCode = spv::Op::OpHitObjectGetWorldToObjectNV;
10236
break;
10237
case glslang::EOpHitObjectGetWorldToObjectEXT:
10238
typeId = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);
10239
opCode = spv::Op::OpHitObjectGetWorldToObjectEXT;
10240
break;
10241
case glslang::EOpHitObjectGetObjectToWorldNV:
10242
typeId = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);
10243
opCode = spv::Op::OpHitObjectGetObjectToWorldNV;
10244
break;
10245
case glslang::EOpHitObjectGetObjectToWorldEXT:
10246
typeId = builder.makeMatrixType(builder.makeFloatType(32), 4, 3);
10247
opCode = spv::Op::OpHitObjectGetObjectToWorldEXT;
10248
break;
10249
case glslang::EOpHitObjectGetInstanceCustomIndexNV:
10250
typeId = builder.makeIntegerType(32, 1);
10251
opCode = spv::Op::OpHitObjectGetInstanceCustomIndexNV;
10252
break;
10253
case glslang::EOpHitObjectGetInstanceCustomIndexEXT:
10254
typeId = builder.makeIntegerType(32, 1);
10255
opCode = spv::Op::OpHitObjectGetInstanceCustomIndexEXT;
10256
break;
10257
case glslang::EOpHitObjectGetInstanceIdNV:
10258
typeId = builder.makeIntegerType(32, 1);
10259
opCode = spv::Op::OpHitObjectGetInstanceIdNV;
10260
break;
10261
case glslang::EOpHitObjectGetInstanceIdEXT:
10262
typeId = builder.makeIntegerType(32, 1);
10263
opCode = spv::Op::OpHitObjectGetInstanceIdEXT;
10264
break;
10265
case glslang::EOpHitObjectGetGeometryIndexNV:
10266
typeId = builder.makeIntegerType(32, 1);
10267
opCode = spv::Op::OpHitObjectGetGeometryIndexNV;
10268
break;
10269
case glslang::EOpHitObjectGetGeometryIndexEXT:
10270
typeId = builder.makeIntegerType(32, 1);
10271
opCode = spv::Op::OpHitObjectGetGeometryIndexEXT;
10272
break;
10273
case glslang::EOpHitObjectGetPrimitiveIndexNV:
10274
typeId = builder.makeIntegerType(32, 1);
10275
opCode = spv::Op::OpHitObjectGetPrimitiveIndexNV;
10276
break;
10277
case glslang::EOpHitObjectGetPrimitiveIndexEXT:
10278
typeId = builder.makeIntegerType(32, 1);
10279
opCode = spv::Op::OpHitObjectGetPrimitiveIndexEXT;
10280
break;
10281
case glslang::EOpHitObjectGetHitKindNV:
10282
typeId = builder.makeIntegerType(32, 0);
10283
opCode = spv::Op::OpHitObjectGetHitKindNV;
10284
break;
10285
case glslang::EOpHitObjectGetHitKindEXT:
10286
typeId = builder.makeIntegerType(32, 0);
10287
opCode = spv::Op::OpHitObjectGetHitKindEXT;
10288
break;
10289
case glslang::EOpHitObjectGetCurrentTimeNV:
10290
typeId = builder.makeFloatType(32);
10291
opCode = spv::Op::OpHitObjectGetCurrentTimeNV;
10292
break;
10293
case glslang::EOpHitObjectGetCurrentTimeEXT:
10294
typeId = builder.makeFloatType(32);
10295
opCode = spv::Op::OpHitObjectGetCurrentTimeEXT;
10296
break;
10297
case glslang::EOpHitObjectGetShaderBindingTableRecordIndexNV:
10298
typeId = builder.makeIntegerType(32, 0);
10299
opCode = spv::Op::OpHitObjectGetShaderBindingTableRecordIndexNV;
10300
return 0;
10301
case glslang::EOpHitObjectGetShaderBindingTableRecordIndexEXT:
10302
typeId = builder.makeIntegerType(32, 0);
10303
opCode = spv::Op::OpHitObjectGetShaderBindingTableRecordIndexEXT;
10304
return 0;
10305
case glslang::EOpHitObjectGetAttributesNV:
10306
builder.createNoResultOp(spv::Op::OpHitObjectGetAttributesNV, operands);
10307
return 0;
10308
case glslang::EOpHitObjectGetAttributesEXT:
10309
builder.createNoResultOp(spv::Op::OpHitObjectGetAttributesEXT, operands);
10310
return 0;
10311
case glslang::EOpHitObjectRecordFromQueryEXT:
10312
builder.createNoResultOp(spv::Op::OpHitObjectRecordFromQueryEXT, operands);
10313
return 0;
10314
case glslang::EOpHitObjectGetShaderRecordBufferHandleNV:
10315
typeId = builder.makeVectorType(builder.makeUintType(32), 2);
10316
opCode = spv::Op::OpHitObjectGetShaderRecordBufferHandleNV;
10317
break;
10318
case glslang::EOpHitObjectGetClusterIdNV:
10319
typeId = builder.makeIntegerType(32, 1);
10320
opCode = spv::Op::OpHitObjectGetClusterIdNV;
10321
break;
10322
case glslang::EOpHitObjectGetShaderRecordBufferHandleEXT:
10323
typeId = builder.makeVectorType(builder.makeUintType(32), 2);
10324
opCode = spv::Op::OpHitObjectGetShaderRecordBufferHandleEXT;
10325
break;
10326
case glslang::EOpHitObjectSetShaderBindingTableRecordIndexEXT:
10327
builder.createNoResultOp(spv::Op::OpHitObjectSetShaderBindingTableRecordIndexEXT, operands);
10328
return 0;
10329
case glslang::EOpReorderThreadNV: {
10330
if (operands.size() == 2) {
10331
builder.createNoResultOp(spv::Op::OpReorderThreadWithHintNV, operands);
10332
} else {
10333
builder.createNoResultOp(spv::Op::OpReorderThreadWithHitObjectNV, operands);
10334
}
10335
return 0;
10336
}
10337
case glslang::EOpReorderThreadEXT: {
10338
if (operands.size() == 2) {
10339
builder.createNoResultOp(spv::Op::OpReorderThreadWithHintEXT, operands);
10340
} else {
10341
builder.createNoResultOp(spv::Op::OpReorderThreadWithHitObjectEXT, operands);
10342
}
10343
return 0;
10344
}
10345
10346
case glslang::EOpHitObjectReorderExecuteEXT: {
10347
if (operands.size() == 2) {
10348
builder.createNoResultOp(spv::Op::OpHitObjectReorderExecuteShaderEXT, operands);
10349
} else {
10350
// GLSL intrinsic is
10351
// hitObjectReorderExecuteEXT(hitObjectEXT hitObject, uint hint, uint bits,int payload) while
10352
// SPIRV is hitObject id , payload id, optional hint id, optional bits id hence reorder operands
10353
builder.createNoResultOp(spv::Op::OpHitObjectReorderExecuteShaderEXT, {operands[0], operands[3], operands[1], operands[2]});
10354
}
10355
return 0;
10356
}
10357
10358
case glslang::EOpHitObjectTraceReorderExecuteEXT: {
10359
if (operands.size() == 12) {
10360
builder.createNoResultOp(spv::Op::OpHitObjectTraceReorderExecuteEXT, operands);
10361
} else {
10362
std::vector<spv::Id> argOperands;
10363
std::copy(operands.begin(), operands.begin() + 11, std::back_inserter(argOperands));
10364
argOperands.push_back(operands[13]);
10365
argOperands.push_back(operands[11]);
10366
argOperands.push_back(operands[12]);
10367
builder.createNoResultOp(spv::Op::OpHitObjectTraceReorderExecuteEXT, argOperands);
10368
}
10369
return 0;
10370
}
10371
case glslang::EOpHitObjectTraceMotionReorderExecuteEXT: {
10372
if (operands.size() == 13) {
10373
builder.createNoResultOp(spv::Op::OpHitObjectTraceMotionReorderExecuteEXT, operands);
10374
} else {
10375
std::vector<spv::Id> argOperands;
10376
std::copy(operands.begin(), operands.begin() + 12, std::back_inserter(argOperands));
10377
argOperands.push_back(operands[14]);
10378
argOperands.push_back(operands[12]);
10379
argOperands.push_back(operands[13]);
10380
builder.createNoResultOp(spv::Op::OpHitObjectTraceMotionReorderExecuteEXT, argOperands);
10381
}
10382
return 0;
10383
}
10384
case glslang::EOpImageSampleWeightedQCOM:
10385
typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
10386
opCode = spv::Op::OpImageSampleWeightedQCOM;
10387
addImageProcessingQCOMDecoration(operands[2], spv::Decoration::WeightTextureQCOM);
10388
break;
10389
case glslang::EOpImageBoxFilterQCOM:
10390
typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
10391
opCode = spv::Op::OpImageBoxFilterQCOM;
10392
break;
10393
case glslang::EOpImageBlockMatchSADQCOM:
10394
typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
10395
opCode = spv::Op::OpImageBlockMatchSADQCOM;
10396
addImageProcessingQCOMDecoration(operands[0], spv::Decoration::BlockMatchTextureQCOM);
10397
addImageProcessingQCOMDecoration(operands[2], spv::Decoration::BlockMatchTextureQCOM);
10398
break;
10399
case glslang::EOpImageBlockMatchSSDQCOM:
10400
typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
10401
opCode = spv::Op::OpImageBlockMatchSSDQCOM;
10402
addImageProcessingQCOMDecoration(operands[0], spv::Decoration::BlockMatchTextureQCOM);
10403
addImageProcessingQCOMDecoration(operands[2], spv::Decoration::BlockMatchTextureQCOM);
10404
break;
10405
10406
case glslang::EOpFetchMicroTriangleVertexBarycentricNV:
10407
typeId = builder.makeVectorType(builder.makeFloatType(32), 2);
10408
opCode = spv::Op::OpFetchMicroTriangleVertexBarycentricNV;
10409
break;
10410
10411
case glslang::EOpFetchMicroTriangleVertexPositionNV:
10412
typeId = builder.makeVectorType(builder.makeFloatType(32), 3);
10413
opCode = spv::Op::OpFetchMicroTriangleVertexPositionNV;
10414
break;
10415
10416
case glslang::EOpImageBlockMatchWindowSSDQCOM:
10417
typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
10418
opCode = spv::Op::OpImageBlockMatchWindowSSDQCOM;
10419
addImageProcessing2QCOMDecoration(operands[0], false);
10420
addImageProcessing2QCOMDecoration(operands[2], false);
10421
break;
10422
case glslang::EOpImageBlockMatchWindowSADQCOM:
10423
typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
10424
opCode = spv::Op::OpImageBlockMatchWindowSADQCOM;
10425
addImageProcessing2QCOMDecoration(operands[0], false);
10426
addImageProcessing2QCOMDecoration(operands[2], false);
10427
break;
10428
case glslang::EOpImageBlockMatchGatherSSDQCOM:
10429
typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
10430
opCode = spv::Op::OpImageBlockMatchGatherSSDQCOM;
10431
addImageProcessing2QCOMDecoration(operands[0], true);
10432
addImageProcessing2QCOMDecoration(operands[2], true);
10433
break;
10434
case glslang::EOpImageBlockMatchGatherSADQCOM:
10435
typeId = builder.makeVectorType(builder.makeFloatType(32), 4);
10436
opCode = spv::Op::OpImageBlockMatchGatherSADQCOM;
10437
addImageProcessing2QCOMDecoration(operands[0], true);
10438
addImageProcessing2QCOMDecoration(operands[2], true);
10439
break;
10440
case glslang::EOpCreateTensorLayoutNV:
10441
return builder.createOp(spv::Op::OpCreateTensorLayoutNV, typeId, std::vector<spv::Id>{});
10442
case glslang::EOpCreateTensorViewNV:
10443
return builder.createOp(spv::Op::OpCreateTensorViewNV, typeId, std::vector<spv::Id>{});
10444
case glslang::EOpTensorLayoutSetBlockSizeNV:
10445
opCode = spv::Op::OpTensorLayoutSetBlockSizeNV;
10446
break;
10447
case glslang::EOpTensorLayoutSetDimensionNV:
10448
opCode = spv::Op::OpTensorLayoutSetDimensionNV;
10449
break;
10450
case glslang::EOpTensorLayoutSetStrideNV:
10451
opCode = spv::Op::OpTensorLayoutSetStrideNV;
10452
break;
10453
case glslang::EOpTensorLayoutSliceNV:
10454
opCode = spv::Op::OpTensorLayoutSliceNV;
10455
break;
10456
case glslang::EOpTensorLayoutSetClampValueNV:
10457
opCode = spv::Op::OpTensorLayoutSetClampValueNV;
10458
break;
10459
case glslang::EOpTensorViewSetDimensionNV:
10460
opCode = spv::Op::OpTensorViewSetDimensionNV;
10461
break;
10462
case glslang::EOpTensorViewSetStrideNV:
10463
opCode = spv::Op::OpTensorViewSetStrideNV;
10464
break;
10465
case glslang::EOpTensorViewSetClipNV:
10466
opCode = spv::Op::OpTensorViewSetClipNV;
10467
break;
10468
default:
10469
return 0;
10470
}
10471
10472
spv::Id id = 0;
10473
if (libCall >= 0) {
10474
// Use an extended instruction from the standard library.
10475
// Construct the call arguments, without modifying the original operands vector.
10476
// We might need the remaining arguments, e.g. in the EOpFrexp case.
10477
std::vector<spv::Id> callArguments(operands.begin(), operands.begin() + consumedOperands);
10478
id = builder.createBuiltinCall(typeId, extBuiltins >= 0 ? extBuiltins : stdBuiltins, libCall, callArguments);
10479
} else if (opCode == spv::Op::OpDot && !isFloat) {
10480
// int dot(int, int)
10481
// NOTE: never called for scalar/vector1, this is turned into simple mul before this can be reached
10482
const int componentCount = builder.getNumComponents(operands[0]);
10483
spv::Id mulOp = builder.createBinOp(spv::Op::OpIMul, builder.getTypeId(operands[0]), operands[0], operands[1]);
10484
builder.setPrecision(mulOp, precision);
10485
id = builder.createCompositeExtract(mulOp, typeId, 0);
10486
for (int i = 1; i < componentCount; ++i) {
10487
builder.setPrecision(id, precision);
10488
id = builder.createBinOp(spv::Op::OpIAdd, typeId, id, builder.createCompositeExtract(mulOp, typeId, i));
10489
}
10490
} else {
10491
switch (consumedOperands) {
10492
case 0:
10493
// should all be handled by visitAggregate and createNoArgOperation
10494
assert(0);
10495
return 0;
10496
case 1:
10497
// should all be handled by createUnaryOperation
10498
assert(0);
10499
return 0;
10500
case 2:
10501
id = builder.createBinOp(opCode, typeId, operands[0], operands[1]);
10502
break;
10503
default:
10504
// anything 3 or over doesn't have l-value operands, so all should be consumed
10505
assert(consumedOperands == operands.size());
10506
id = builder.createOp(opCode, typeId, operands);
10507
break;
10508
}
10509
}
10510
10511
// Decode the return types that were structures
10512
switch (op) {
10513
case glslang::EOpAddCarry:
10514
case glslang::EOpSubBorrow:
10515
builder.createStore(builder.createCompositeExtract(id, typeId0, 1), operands[2]);
10516
id = builder.createCompositeExtract(id, typeId0, 0);
10517
break;
10518
case glslang::EOpUMulExtended:
10519
case glslang::EOpIMulExtended:
10520
builder.createStore(builder.createCompositeExtract(id, typeId0, 0), operands[3]);
10521
builder.createStore(builder.createCompositeExtract(id, typeId0, 1), operands[2]);
10522
break;
10523
case glslang::EOpModf:
10524
{
10525
assert(operands.size() == 2);
10526
builder.createStore(builder.createCompositeExtract(id, typeId0, 1), operands[1]);
10527
id = builder.createCompositeExtract(id, typeId0, 0);
10528
}
10529
break;
10530
case glslang::EOpFrexp:
10531
{
10532
assert(operands.size() == 2);
10533
if (builder.isFloatType(builder.getScalarTypeId(typeId1))) {
10534
// "exp" is floating-point type (from HLSL intrinsic)
10535
spv::Id member1 = builder.createCompositeExtract(id, frexpIntType, 1);
10536
member1 = builder.createUnaryOp(spv::Op::OpConvertSToF, typeId1, member1);
10537
builder.createStore(member1, operands[1]);
10538
} else
10539
// "exp" is integer type (from GLSL built-in function)
10540
builder.createStore(builder.createCompositeExtract(id, frexpIntType, 1), operands[1]);
10541
id = builder.createCompositeExtract(id, typeId0, 0);
10542
}
10543
break;
10544
default:
10545
break;
10546
}
10547
10548
return builder.setPrecision(id, precision);
10549
}
10550
10551
// Intrinsics with no arguments (or no return value, and no precision).
10552
spv::Id TGlslangToSpvTraverser::createNoArgOperation(glslang::TOperator op, spv::Decoration precision, spv::Id typeId)
10553
{
10554
// GLSL memory barriers use queuefamily scope in new model, device scope in old model
10555
spv::Scope memoryBarrierScope = glslangIntermediate->usingVulkanMemoryModel() ?
10556
spv::Scope::QueueFamilyKHR : spv::Scope::Device;
10557
10558
switch (op) {
10559
case glslang::EOpBarrier:
10560
if (glslangIntermediate->getStage() == EShLangTessControl) {
10561
if (glslangIntermediate->usingVulkanMemoryModel()) {
10562
builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Workgroup,
10563
spv::MemorySemanticsMask::OutputMemoryKHR |
10564
spv::MemorySemanticsMask::AcquireRelease);
10565
builder.addCapability(spv::Capability::VulkanMemoryModelKHR);
10566
} else {
10567
builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Invocation, spv::MemorySemanticsMask::MaskNone);
10568
}
10569
} else {
10570
builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Workgroup,
10571
spv::MemorySemanticsMask::WorkgroupMemory |
10572
spv::MemorySemanticsMask::AcquireRelease);
10573
}
10574
return 0;
10575
case glslang::EOpMemoryBarrier:
10576
builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsAllMemory |
10577
spv::MemorySemanticsMask::AcquireRelease);
10578
return 0;
10579
case glslang::EOpMemoryBarrierBuffer:
10580
builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsMask::UniformMemory |
10581
spv::MemorySemanticsMask::AcquireRelease);
10582
return 0;
10583
case glslang::EOpMemoryBarrierShared:
10584
builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsMask::WorkgroupMemory |
10585
spv::MemorySemanticsMask::AcquireRelease);
10586
return 0;
10587
case glslang::EOpGroupMemoryBarrier:
10588
builder.createMemoryBarrier(spv::Scope::Workgroup, spv::MemorySemanticsAllMemory |
10589
spv::MemorySemanticsMask::AcquireRelease);
10590
return 0;
10591
case glslang::EOpMemoryBarrierAtomicCounter:
10592
builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsMask::AtomicCounterMemory |
10593
spv::MemorySemanticsMask::AcquireRelease);
10594
return 0;
10595
case glslang::EOpMemoryBarrierImage:
10596
builder.createMemoryBarrier(memoryBarrierScope, spv::MemorySemanticsMask::ImageMemory |
10597
spv::MemorySemanticsMask::AcquireRelease);
10598
return 0;
10599
case glslang::EOpAllMemoryBarrierWithGroupSync:
10600
builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Device,
10601
spv::MemorySemanticsAllMemory |
10602
spv::MemorySemanticsMask::AcquireRelease);
10603
return 0;
10604
case glslang::EOpDeviceMemoryBarrier:
10605
builder.createMemoryBarrier(spv::Scope::Device, spv::MemorySemanticsMask::UniformMemory |
10606
spv::MemorySemanticsMask::ImageMemory |
10607
spv::MemorySemanticsMask::AcquireRelease);
10608
return 0;
10609
case glslang::EOpDeviceMemoryBarrierWithGroupSync:
10610
builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Device, spv::MemorySemanticsMask::UniformMemory |
10611
spv::MemorySemanticsMask::ImageMemory |
10612
spv::MemorySemanticsMask::AcquireRelease);
10613
return 0;
10614
case glslang::EOpWorkgroupMemoryBarrier:
10615
builder.createMemoryBarrier(spv::Scope::Workgroup, spv::MemorySemanticsMask::WorkgroupMemory |
10616
spv::MemorySemanticsMask::AcquireRelease);
10617
return 0;
10618
case glslang::EOpWorkgroupMemoryBarrierWithGroupSync:
10619
builder.createControlBarrier(spv::Scope::Workgroup, spv::Scope::Workgroup,
10620
spv::MemorySemanticsMask::WorkgroupMemory |
10621
spv::MemorySemanticsMask::AcquireRelease);
10622
return 0;
10623
case glslang::EOpSubgroupBarrier:
10624
builder.createControlBarrier(spv::Scope::Subgroup, spv::Scope::Subgroup, spv::MemorySemanticsAllMemory |
10625
spv::MemorySemanticsMask::AcquireRelease);
10626
return spv::NoResult;
10627
case glslang::EOpSubgroupMemoryBarrier:
10628
builder.createMemoryBarrier(spv::Scope::Subgroup, spv::MemorySemanticsAllMemory |
10629
spv::MemorySemanticsMask::AcquireRelease);
10630
return spv::NoResult;
10631
case glslang::EOpSubgroupMemoryBarrierBuffer:
10632
builder.createMemoryBarrier(spv::Scope::Subgroup, spv::MemorySemanticsMask::UniformMemory |
10633
spv::MemorySemanticsMask::AcquireRelease);
10634
return spv::NoResult;
10635
case glslang::EOpSubgroupMemoryBarrierImage:
10636
builder.createMemoryBarrier(spv::Scope::Subgroup, spv::MemorySemanticsMask::ImageMemory |
10637
spv::MemorySemanticsMask::AcquireRelease);
10638
return spv::NoResult;
10639
case glslang::EOpSubgroupMemoryBarrierShared:
10640
builder.createMemoryBarrier(spv::Scope::Subgroup, spv::MemorySemanticsMask::WorkgroupMemory |
10641
spv::MemorySemanticsMask::AcquireRelease);
10642
return spv::NoResult;
10643
10644
case glslang::EOpEmitVertex:
10645
builder.createNoResultOp(spv::Op::OpEmitVertex);
10646
return 0;
10647
case glslang::EOpEndPrimitive:
10648
builder.createNoResultOp(spv::Op::OpEndPrimitive);
10649
return 0;
10650
10651
case glslang::EOpSubgroupElect: {
10652
std::vector<spv::Id> operands;
10653
return createSubgroupOperation(op, typeId, operands, glslang::EbtVoid);
10654
}
10655
case glslang::EOpTime:
10656
{
10657
std::vector<spv::Id> args; // Dummy arguments
10658
spv::Id id = builder.createBuiltinCall(typeId, getExtBuiltins(spv::E_SPV_AMD_gcn_shader), spv::TimeAMD, args);
10659
return builder.setPrecision(id, precision);
10660
}
10661
case glslang::EOpIgnoreIntersectionNV:
10662
builder.createNoResultOp(spv::Op::OpIgnoreIntersectionNV);
10663
return 0;
10664
case glslang::EOpTerminateRayNV:
10665
builder.createNoResultOp(spv::Op::OpTerminateRayNV);
10666
return 0;
10667
case glslang::EOpRayQueryInitialize:
10668
builder.createNoResultOp(spv::Op::OpRayQueryInitializeKHR);
10669
return 0;
10670
case glslang::EOpRayQueryTerminate:
10671
builder.createNoResultOp(spv::Op::OpRayQueryTerminateKHR);
10672
return 0;
10673
case glslang::EOpRayQueryGenerateIntersection:
10674
builder.createNoResultOp(spv::Op::OpRayQueryGenerateIntersectionKHR);
10675
return 0;
10676
case glslang::EOpRayQueryConfirmIntersection:
10677
builder.createNoResultOp(spv::Op::OpRayQueryConfirmIntersectionKHR);
10678
return 0;
10679
case glslang::EOpBeginInvocationInterlock:
10680
builder.createNoResultOp(spv::Op::OpBeginInvocationInterlockEXT);
10681
return 0;
10682
case glslang::EOpEndInvocationInterlock:
10683
builder.createNoResultOp(spv::Op::OpEndInvocationInterlockEXT);
10684
return 0;
10685
10686
case glslang::EOpIsHelperInvocation:
10687
{
10688
std::vector<spv::Id> args; // Dummy arguments
10689
builder.addExtension(spv::E_SPV_EXT_demote_to_helper_invocation);
10690
builder.addCapability(spv::Capability::DemoteToHelperInvocationEXT);
10691
return builder.createOp(spv::Op::OpIsHelperInvocationEXT, typeId, args);
10692
}
10693
10694
case glslang::EOpReadClockSubgroupKHR: {
10695
std::vector<spv::Id> args;
10696
args.push_back(builder.makeUintConstant(spv::Scope::Subgroup));
10697
builder.addExtension(spv::E_SPV_KHR_shader_clock);
10698
builder.addCapability(spv::Capability::ShaderClockKHR);
10699
return builder.createOp(spv::Op::OpReadClockKHR, typeId, args);
10700
}
10701
10702
case glslang::EOpReadClockDeviceKHR: {
10703
std::vector<spv::Id> args;
10704
args.push_back(builder.makeUintConstant(spv::Scope::Device));
10705
builder.addExtension(spv::E_SPV_KHR_shader_clock);
10706
builder.addCapability(spv::Capability::ShaderClockKHR);
10707
return builder.createOp(spv::Op::OpReadClockKHR, typeId, args);
10708
}
10709
case glslang::EOpStencilAttachmentReadEXT:
10710
case glslang::EOpDepthAttachmentReadEXT:
10711
{
10712
builder.addExtension(spv::E_SPV_EXT_shader_tile_image);
10713
10714
spv::Decoration precision;
10715
spv::Op spv_op;
10716
if (op == glslang::EOpStencilAttachmentReadEXT)
10717
{
10718
precision = spv::Decoration::RelaxedPrecision;
10719
spv_op = spv::Op::OpStencilAttachmentReadEXT;
10720
builder.addCapability(spv::Capability::TileImageStencilReadAccessEXT);
10721
}
10722
else
10723
{
10724
precision = spv::NoPrecision;
10725
spv_op = spv::Op::OpDepthAttachmentReadEXT;
10726
builder.addCapability(spv::Capability::TileImageDepthReadAccessEXT);
10727
}
10728
10729
std::vector<spv::Id> args; // Dummy args
10730
spv::Id result = builder.createOp(spv_op, typeId, args);
10731
return builder.setPrecision(result, precision);
10732
}
10733
default:
10734
break;
10735
}
10736
10737
logger->missingFunctionality("unknown operation with no arguments");
10738
10739
return 0;
10740
}
10741
10742
// Return the SPIR-V <id> associated with 'symbol'.
//
// A previously seen symbol is answered from 'symbolValues'. Otherwise a variable is
// created through createSpvVariable(), recorded, and decorated from the symbol's
// qualifier. Symbols of basic type EbtFunction get no variable and yield 0.
spv::Id TGlslangToSpvTraverser::getSymbolId(const glslang::TIntermSymbol* symbol)
{
    const auto known = symbolValues.find(symbol->getId());
    if (known != symbolValues.end())
        return known->second;

    // it was not found, create it
    const auto& qualifier = symbol->getQualifier();
    const auto& type = symbol->getType();
    const auto& typeQualifier = type.getQualifier();

    const spv::BuiltIn builtIn = TranslateBuiltInDecoration(qualifier.builtIn, false);
    const auto forcedType = getForcedType(qualifier.builtIn, type);

    // Record 'varId' as the value of this symbol, along with its forced type (if any).
    const auto remember = [&](spv::Id varId) {
        symbolValues[symbol->getId()] = varId;
        if (forcedType.second != spv::NoType)
            forceType[varId] = forcedType.second;
    };

    // There are pairs of symbols that map to the same SPIR-V built-in:
    // gl_ObjectToWorldEXT and gl_ObjectToWorld3x4EXT, and gl_WorldToObjectEXT
    // and gl_WorldToObject3x4EXT. SPIR-V forbids having two OpVariables
    // with the same BuiltIn in the same storage class, so we must re-use one.
    const bool mayNeedToReuseBuiltIn =
        builtIn == spv::BuiltIn::ObjectToWorldKHR ||
        builtIn == spv::BuiltIn::WorldToObjectKHR;

    if (mayNeedToReuseBuiltIn) {
        const auto shared = builtInVariableIds.find(uint32_t(builtIn));
        if (shared != builtInVariableIds.end()) {
            const spv::Id sharedId = shared->second;
            remember(sharedId);
            return sharedId;
        }
    }

    if (symbol->getBasicType() == glslang::EbtFunction)
        return 0;

    const spv::Id id = createSpvVariable(symbol, forcedType.first);

    if (mayNeedToReuseBuiltIn)
        builtInVariableIds.insert({uint32_t(builtIn), id});

    remember(id);

    // Decorations that only apply to non-block objects.
    if (symbol->getBasicType() != glslang::EbtBlock) {
        builder.addDecoration(id, TranslatePrecisionDecoration(type));
        builder.addDecoration(id, TranslateInterpolationDecoration(typeQualifier));
        builder.addDecoration(id, TranslateAuxiliaryStorageDecoration(typeQualifier));
        addMeshNVDecoration(id, /*member*/ -1, typeQualifier);
        if (qualifier.hasComponent())
            builder.addDecoration(id, spv::Decoration::Component, qualifier.layoutComponent);
        if (qualifier.hasIndex())
            builder.addDecoration(id, spv::Decoration::Index, qualifier.layoutIndex);
        if (typeQualifier.hasSpecConstantId())
            builder.addDecoration(id, spv::Decoration::SpecId, typeQualifier.layoutSpecConstantId);
        // atomic counters use this:
        if (qualifier.hasOffset())
            builder.addDecoration(id, spv::Decoration::Offset, qualifier.layoutOffset);
    }

    // Location values are used to link TraceRayKHR/ExecuteCallableKHR/HitObjectGetAttributesNV
    // to corresponding variables but are not valid in SPIRV since they are supported only
    // for Input/Output Storage classes. This predicate identifies those link-only variables.
    const auto isRayTracingLinkVariable = [&]() {
        if (!glslangIntermediate->isRayTracingStage())
            return false;
        const bool rayTracingExtensionRequested =
            glslangIntermediate->IsRequestedExtension(glslang::E_GL_EXT_ray_tracing) ||
            glslangIntermediate->IsRequestedExtension(glslang::E_GL_NV_shader_invocation_reorder) ||
            glslangIntermediate->IsRequestedExtension(glslang::E_GL_EXT_shader_invocation_reorder);
        if (!rayTracingExtensionRequested)
            return false;
        const auto storageClass = builder.getStorageClass(id);
        return storageClass == spv::StorageClass::RayPayloadKHR ||
               storageClass == spv::StorageClass::IncomingRayPayloadKHR ||
               storageClass == spv::StorageClass::CallableDataKHR ||
               storageClass == spv::StorageClass::IncomingCallableDataKHR ||
               storageClass == spv::StorageClass::HitObjectAttributeEXT ||
               storageClass == spv::StorageClass::HitObjectAttributeNV;
    };

    if (qualifier.hasLocation() && !isRayTracingLinkVariable())
        builder.addDecoration(id, spv::Decoration::Location, qualifier.layoutLocation);

    builder.addDecoration(id, TranslateInvariantDecoration(typeQualifier));

    if (qualifier.hasStream() && glslangIntermediate->isMultiStream()) {
        builder.addCapability(spv::Capability::GeometryStreams);
        builder.addDecoration(id, spv::Decoration::Stream, qualifier.layoutStream);
    }

    // Descriptor set and binding: explicit value if given, otherwise 0 for descriptor resources.
    if (qualifier.hasSet()) {
        builder.addDecoration(id, spv::Decoration::DescriptorSet, qualifier.layoutSet);
    } else if (IsDescriptorResource(type)) {
        builder.addDecoration(id, spv::Decoration::DescriptorSet, 0);
    }
    if (qualifier.hasBinding()) {
        builder.addDecoration(id, spv::Decoration::Binding, qualifier.layoutBinding);
    } else if (IsDescriptorResource(type)) {
        builder.addDecoration(id, spv::Decoration::Binding, 0);
    }

    if (qualifier.hasAttachment())
        builder.addDecoration(id, spv::Decoration::InputAttachmentIndex, qualifier.layoutAttachment);

    // Transform feedback.
    if (glslangIntermediate->getXfbMode()) {
        builder.addCapability(spv::Capability::TransformFeedback);
        if (qualifier.hasXfbBuffer()) {
            builder.addDecoration(id, spv::Decoration::XfbBuffer, qualifier.layoutXfbBuffer);
            const unsigned xfbStride = glslangIntermediate->getXfbStride(qualifier.layoutXfbBuffer);
            if (xfbStride != glslang::TQualifier::layoutXfbStrideEnd)
                builder.addDecoration(id, spv::Decoration::XfbStride, xfbStride);
        }
        if (qualifier.hasXfbOffset())
            builder.addDecoration(id, spv::Decoration::Offset, qualifier.layoutXfbOffset);
    }

    // add built-in variable decoration (WorkgroupSize deprecated in spirv1.6)
    if (builtIn != spv::BuiltIn::Max &&
        (glslangIntermediate->getSpv().spv < glslang::EShTargetSpv_1_6 ||
         builtIn != spv::BuiltIn::WorkgroupSize)) {
        builder.addDecoration(id, spv::Decoration::BuiltIn, (int)builtIn);
    }

    // Add volatile decoration to HelperInvocation for spirv1.6 and beyond
    if (builtIn == spv::BuiltIn::HelperInvocation &&
        !glslangIntermediate->usingVulkanMemoryModel() &&
        glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_6) {
        builder.addDecoration(id, spv::Decoration::Volatile);
    }

    // Images and pipe-input symbols get the decorations produced by TranslateMemoryDecoration().
    if (type.isImage() || qualifier.isPipeInput()) {
        std::vector<spv::Decoration> memory;
        TranslateMemoryDecoration(typeQualifier, memory, glslangIntermediate->usingVulkanMemoryModel());
        for (const spv::Decoration memoryDecoration : memory)
            builder.addDecoration(id, memoryDecoration);
    }

    if (builtIn == spv::BuiltIn::SampleMask) {
        // GL_NV_sample_mask_override_coverage extension
        const spv::Decoration decoration = glslangIntermediate->getLayoutOverrideCoverage()
                                               ? spv::Decoration::OverrideCoverageNV
                                               : spv::Decoration::Max;
        builder.addDecoration(id, decoration);
        if (decoration != spv::Decoration::Max) {
            builder.addCapability(spv::Capability::SampleMaskOverrideCoverageNV);
            builder.addExtension(spv::E_SPV_NV_sample_mask_override_coverage);
        }
    } else if (builtIn == spv::BuiltIn::Layer) {
        // SPV_NV_viewport_array2 extension
        if (qualifier.layoutViewportRelative) {
            builder.addDecoration(id, spv::Decoration::ViewportRelativeNV);
            builder.addCapability(spv::Capability::ShaderViewportMaskNV);
            builder.addExtension(spv::E_SPV_NV_viewport_array2);
        }
        if (qualifier.layoutSecondaryViewportRelativeOffset != -2048) {
            builder.addDecoration(id, spv::Decoration::SecondaryViewportRelativeNV,
                                  qualifier.layoutSecondaryViewportRelativeOffset);
            builder.addCapability(spv::Capability::ShaderStereoViewNV);
            builder.addExtension(spv::E_SPV_NV_stereo_view_rendering);
        }
    }

    if (qualifier.layoutPassthrough) {
        builder.addDecoration(id, spv::Decoration::PassthroughNV);
        builder.addCapability(spv::Capability::GeometryShaderPassthroughNV);
        builder.addExtension(spv::E_SPV_NV_geometry_shader_passthrough);
    }

    if (qualifier.pervertexNV) {
        builder.addDecoration(id, spv::Decoration::PerVertexNV);
        builder.addCapability(spv::Capability::FragmentBarycentricNV);
        builder.addExtension(spv::E_SPV_NV_fragment_shader_barycentric);
    }

    if (qualifier.pervertexEXT) {
        builder.addDecoration(id, spv::Decoration::PerVertexKHR);
        builder.addCapability(spv::Capability::FragmentBarycentricKHR);
        builder.addExtension(spv::E_SPV_KHR_fragment_shader_barycentric);
    }

    if (glslangIntermediate->getHlslFunctionality1() && typeQualifier.semanticName != nullptr) {
        builder.addExtension("SPV_GOOGLE_hlsl_functionality1");
        builder.addDecoration(id, spv::Decoration::HlslSemanticGOOGLE, typeQualifier.semanticName);
    }

    if (symbol->isReference()) {
        builder.addDecoration(id, typeQualifier.restrict ? spv::Decoration::RestrictPointerEXT
                                                         : spv::Decoration::AliasedPointerEXT);
    }

    // Add SPIR-V decorations (GL_EXT_spirv_intrinsics)
    if (typeQualifier.hasSpirvDecorate())
        applySpirvDecorate(type, id, {});

    return id;
}
10939
10940
// add per-primitive, per-view. per-task decorations to a struct member (member >= 0) or an object
10941
void TGlslangToSpvTraverser::addMeshNVDecoration(spv::Id id, int member, const glslang::TQualifier& qualifier)
10942
{
10943
bool isMeshShaderExt = (glslangIntermediate->getRequestedExtensions().find(glslang::E_GL_EXT_mesh_shader) !=
10944
glslangIntermediate->getRequestedExtensions().end());
10945
10946
if (member >= 0) {
10947
if (qualifier.perPrimitiveNV) {
10948
// Need to add capability/extension for fragment shader.
10949
// Mesh shader already adds this by default.
10950
if (glslangIntermediate->getStage() == EShLangFragment) {
10951
if(isMeshShaderExt) {
10952
builder.addCapability(spv::Capability::MeshShadingEXT);
10953
builder.addExtension(spv::E_SPV_EXT_mesh_shader);
10954
} else {
10955
builder.addCapability(spv::Capability::MeshShadingNV);
10956
builder.addExtension(spv::E_SPV_NV_mesh_shader);
10957
}
10958
}
10959
builder.addMemberDecoration(id, (unsigned)member, spv::Decoration::PerPrimitiveNV);
10960
}
10961
if (qualifier.perViewNV)
10962
builder.addMemberDecoration(id, (unsigned)member, spv::Decoration::PerViewNV);
10963
if (qualifier.perTaskNV)
10964
builder.addMemberDecoration(id, (unsigned)member, spv::Decoration::PerTaskNV);
10965
} else {
10966
if (qualifier.perPrimitiveNV) {
10967
// Need to add capability/extension for fragment shader.
10968
// Mesh shader already adds this by default.
10969
if (glslangIntermediate->getStage() == EShLangFragment) {
10970
if(isMeshShaderExt) {
10971
builder.addCapability(spv::Capability::MeshShadingEXT);
10972
builder.addExtension(spv::E_SPV_EXT_mesh_shader);
10973
} else {
10974
builder.addCapability(spv::Capability::MeshShadingNV);
10975
builder.addExtension(spv::E_SPV_NV_mesh_shader);
10976
}
10977
}
10978
builder.addDecoration(id, spv::Decoration::PerPrimitiveNV);
10979
}
10980
if (qualifier.perViewNV)
10981
builder.addDecoration(id, spv::Decoration::PerViewNV);
10982
if (qualifier.perTaskNV)
10983
builder.addDecoration(id, spv::Decoration::PerTaskNV);
10984
}
10985
}
10986
10987
// Report whether 'decor' has already been recorded for 'id' in idToQCOMDecorations.
//
// Uses find() rather than operator[] so that a pure query does not insert an empty
// entry into the table for every id that is probed.
bool TGlslangToSpvTraverser::hasQCOMImageProceessingDecoration(spv::Id id, spv::Decoration decor)
{
    const auto entry = idToQCOMDecorations.find(id);
    if (entry == idToQCOMDecorations.end())
        return false;

    for (const spv::Decoration recorded : entry->second) {
        if (recorded == decor)
            return true;
    }
    return false;
}
10996
10997
// Decorate the object that 'id' was loaded from with 'decor', at most once per object.
// If 'id' is an OpSampledImage, its first operand is examined instead. Nothing is
// done unless the examined instruction is an OpLoad.
void TGlslangToSpvTraverser::addImageProcessingQCOMDecoration(spv::Id id, spv::Decoration decor)
{
    // look through a sampled image to its first operand
    if (builder.getOpCode(id) == spv::Op::OpSampledImage)
        id = builder.getIdOperand(id, 0);

    if (builder.getOpCode(id) != spv::Op::OpLoad)
        return;

    const spv::Id loadedFrom = builder.getIdOperand(id, 0);
    if (hasQCOMImageProceessingDecoration(loadedFrom, decor))
        return;

    builder.addDecoration(loadedFrom, decor);
    idToQCOMDecorations[loadedFrom].push_back(decor);
}
11013
11014
// Add the block-match decorations for 'id'.
//
// For gather operations only BlockMatchTextureQCOM is added, through
// addImageProcessingQCOMDecoration(). Otherwise both the texture and the sampler
// decoration are added: to the sources of the two operands when 'id' is an
// OpSampledImage, or both to the source of 'id' itself when it is not.
void TGlslangToSpvTraverser::addImageProcessing2QCOMDecoration(spv::Id id, bool isForGather)
{
    if (isForGather) {
        addImageProcessingQCOMDecoration(id, spv::Decoration::BlockMatchTextureQCOM);
        return;
    }

    // Decorate the object 'loaded' was loaded from, once per (object, decoration) pair.
    const auto decorateLoadSource = [this](spv::Id loaded, spv::Decoration decor) {
        if (builder.getOpCode(loaded) != spv::Op::OpLoad)
            return;

        const spv::Id source = builder.getIdOperand(loaded, 0);
        if (glslangIntermediate->getSpv().spv >= glslang::EShTargetSpv_1_4) {
            assert(iOSet.count(source) > 0);
        }
        if (hasQCOMImageProceessingDecoration(source, decor))
            return;

        builder.addDecoration(source, decor);
        idToQCOMDecorations[source].push_back(decor);
    };

    if (builder.getOpCode(id) == spv::Op::OpSampledImage) {
        // separate texture and sampler operands
        decorateLoadSource(builder.getIdOperand(id, 0), spv::Decoration::BlockMatchTextureQCOM);
        decorateLoadSource(builder.getIdOperand(id, 1), spv::Decoration::BlockMatchSamplerQCOM);
    } else {
        // a single interface object receives both decorations
        decorateLoadSource(id, spv::Decoration::BlockMatchTextureQCOM);
        decorateLoadSource(id, spv::Decoration::BlockMatchSamplerQCOM);
    }
}
11046
11047
// Make a full tree of instructions to build a SPIR-V specialization constant,
11048
// or regular constant if possible.
11049
//
11050
// TBD: this is not yet done, nor verified to be the best design, it does do the leaf symbols though
11051
//
11052
// Recursively walk the nodes. The nodes form a tree whose leaves are
11053
// regular constants, which themselves are trees that createSpvConstant()
11054
// recursively walks. So, this function walks the "top" of the tree:
11055
// - emit specialization constant-building instructions for specConstant
11056
// - when running into a non-spec-constant, switch to createSpvConstant()
11057
spv::Id TGlslangToSpvTraverser::createSpvConstant(const glslang::TIntermTyped& node)
11058
{
11059
assert(node.getQualifier().isConstant());
11060
11061
// Handle front-end constants first (non-specialization constants).
11062
if (! node.getQualifier().specConstant) {
11063
// hand off to the non-spec-constant path
11064
assert(node.getAsConstantUnion() != nullptr || node.getAsSymbolNode() != nullptr);
11065
int nextConst = 0;
11066
return createSpvConstantFromConstUnionArray(node.getType(), node.getAsConstantUnion() ?
11067
node.getAsConstantUnion()->getConstArray() : node.getAsSymbolNode()->getConstArray(),
11068
nextConst, false);
11069
}
11070
11071
// We now know we have a specialization constant to build
11072
11073
// Extra capabilities may be needed.
11074
if (node.getType().contains8BitInt())
11075
builder.addCapability(spv::Capability::Int8);
11076
if (node.getType().contains16BitFloat())
11077
builder.addCapability(spv::Capability::Float16);
11078
if (node.getType().contains16BitInt())
11079
builder.addCapability(spv::Capability::Int16);
11080
if (node.getType().contains64BitInt())
11081
builder.addCapability(spv::Capability::Int64);
11082
if (node.getType().containsDouble())
11083
builder.addCapability(spv::Capability::Float64);
11084
11085
// gl_WorkGroupSize is a special case until the front-end handles hierarchical specialization constants,
11086
// even then, it's specialization ids are handled by special case syntax in GLSL: layout(local_size_x = ...
11087
if (node.getType().getQualifier().builtIn == glslang::EbvWorkGroupSize) {
11088
std::vector<spv::Id> dimConstId;
11089
for (int dim = 0; dim < 3; ++dim) {
11090
bool specConst = (glslangIntermediate->getLocalSizeSpecId(dim) != glslang::TQualifier::layoutNotSet);
11091
dimConstId.push_back(builder.makeUintConstant(glslangIntermediate->getLocalSize(dim), specConst));
11092
if (specConst) {
11093
builder.addDecoration(dimConstId.back(), spv::Decoration::SpecId,
11094
glslangIntermediate->getLocalSizeSpecId(dim));
11095
}
11096
}
11097
return builder.makeCompositeConstant(builder.makeVectorType(builder.makeUintType(32), 3), dimConstId, true);
11098
}
11099
11100
// An AST node labelled as specialization constant should be a symbol node.
11101
// Its initializer should either be a sub tree with constant nodes, or a constant union array.
11102
if (auto* sn = node.getAsSymbolNode()) {
11103
spv::Id result;
11104
if (auto* sub_tree = sn->getConstSubtree()) {
11105
// Traverse the constant constructor sub tree like generating normal run-time instructions.
11106
// During the AST traversal, if the node is marked as 'specConstant', SpecConstantOpModeGuard
11107
// will set the builder into spec constant op instruction generating mode.
11108
sub_tree->traverse(this);
11109
result = accessChainLoad(sub_tree->getType());
11110
} else if (auto* const_union_array = &sn->getConstArray()) {
11111
int nextConst = 0;
11112
result = createSpvConstantFromConstUnionArray(sn->getType(), *const_union_array, nextConst, true);
11113
} else {
11114
logger->missingFunctionality("Invalid initializer for spec constant.");
11115
return spv::NoResult;
11116
}
11117
builder.addName(result, sn->getName().c_str());
11118
return result;
11119
}
11120
11121
// Neither a front-end constant node, nor a specialization constant node with constant union array or
11122
// constant sub tree as initializer.
11123
logger->missingFunctionality("Neither a front-end constant nor a spec constant.");
11124
return spv::NoResult;
11125
}
11126
11127
// Use 'consts' as the flattened glslang source of scalar constants to recursively
11128
// build the aggregate SPIR-V constant.
11129
//
11130
// If there are not enough elements present in 'consts', 0 will be substituted;
11131
// an empty 'consts' can be used to create a fully zeroed SPIR-V constant.
11132
//
11133
spv::Id TGlslangToSpvTraverser::createSpvConstantFromConstUnionArray(const glslang::TType& glslangType,
11134
const glslang::TConstUnionArray& consts, int& nextConst, bool specConstant)
11135
{
11136
// vector of constants for SPIR-V
11137
std::vector<spv::Id> spvConsts;
11138
11139
// Type is used for struct and array constants
11140
spv::Id typeId = convertGlslangToSpvType(glslangType);
11141
11142
if (glslangType.isArray()) {
11143
glslang::TType elementType(glslangType, 0);
11144
for (int i = 0; i < glslangType.getOuterArraySize(); ++i)
11145
spvConsts.push_back(createSpvConstantFromConstUnionArray(elementType, consts, nextConst, false));
11146
} else if (glslangType.isMatrix()) {
11147
glslang::TType vectorType(glslangType, 0);
11148
for (int col = 0; col < glslangType.getMatrixCols(); ++col)
11149
spvConsts.push_back(createSpvConstantFromConstUnionArray(vectorType, consts, nextConst, false));
11150
} else if (glslangType.isCoopMat()) {
11151
glslang::TType componentType(glslangType.getBasicType());
11152
spvConsts.push_back(createSpvConstantFromConstUnionArray(componentType, consts, nextConst, false));
11153
} else if (glslangType.isStruct()) {
11154
glslang::TVector<glslang::TTypeLoc>::const_iterator iter;
11155
for (iter = glslangType.getStruct()->begin(); iter != glslangType.getStruct()->end(); ++iter)
11156
spvConsts.push_back(createSpvConstantFromConstUnionArray(*iter->type, consts, nextConst, false));
11157
} else if (glslangType.getVectorSize() > 1 || glslangType.isCoopVecNV()) {
11158
unsigned int numComponents = glslangType.isCoopVecNV() ? glslangType.getTypeParameters()->arraySizes->getDimSize(0) : glslangType.getVectorSize();
11159
for (unsigned int i = 0; i < numComponents; ++i) {
11160
bool zero = nextConst >= consts.size();
11161
switch (glslangType.getBasicType()) {
11162
case glslang::EbtInt:
11163
spvConsts.push_back(builder.makeIntConstant(zero ? 0 : consts[nextConst].getIConst()));
11164
break;
11165
case glslang::EbtUint:
11166
spvConsts.push_back(builder.makeUintConstant(zero ? 0 : consts[nextConst].getUConst()));
11167
break;
11168
case glslang::EbtFloat:
11169
spvConsts.push_back(builder.makeFloatConstant(zero ? 0.0F : (float)consts[nextConst].getDConst()));
11170
break;
11171
case glslang::EbtBool:
11172
spvConsts.push_back(builder.makeBoolConstant(zero ? false : consts[nextConst].getBConst()));
11173
break;
11174
case glslang::EbtInt8:
11175
builder.addCapability(spv::Capability::Int8);
11176
spvConsts.push_back(builder.makeInt8Constant(zero ? 0 : consts[nextConst].getI8Const()));
11177
break;
11178
case glslang::EbtUint8:
11179
builder.addCapability(spv::Capability::Int8);
11180
spvConsts.push_back(builder.makeUint8Constant(zero ? 0 : consts[nextConst].getU8Const()));
11181
break;
11182
case glslang::EbtInt16:
11183
builder.addCapability(spv::Capability::Int16);
11184
spvConsts.push_back(builder.makeInt16Constant(zero ? 0 : consts[nextConst].getI16Const()));
11185
break;
11186
case glslang::EbtUint16:
11187
builder.addCapability(spv::Capability::Int16);
11188
spvConsts.push_back(builder.makeUint16Constant(zero ? 0 : consts[nextConst].getU16Const()));
11189
break;
11190
case glslang::EbtInt64:
11191
spvConsts.push_back(builder.makeInt64Constant(zero ? 0 : consts[nextConst].getI64Const()));
11192
break;
11193
case glslang::EbtUint64:
11194
spvConsts.push_back(builder.makeUint64Constant(zero ? 0 : consts[nextConst].getU64Const()));
11195
break;
11196
case glslang::EbtDouble:
11197
spvConsts.push_back(builder.makeDoubleConstant(zero ? 0.0 : consts[nextConst].getDConst()));
11198
break;
11199
case glslang::EbtFloat16:
11200
builder.addCapability(spv::Capability::Float16);
11201
spvConsts.push_back(builder.makeFloat16Constant(zero ? 0.0F : (float)consts[nextConst].getDConst()));
11202
break;
11203
case glslang::EbtBFloat16:
11204
spvConsts.push_back(builder.makeBFloat16Constant(zero ? 0.0F : (float)consts[nextConst].getDConst()));
11205
break;
11206
case glslang::EbtFloatE5M2:
11207
spvConsts.push_back(builder.makeFloatE5M2Constant(zero ? 0.0F : (float)consts[nextConst].getDConst()));
11208
break;
11209
case glslang::EbtFloatE4M3:
11210
spvConsts.push_back(builder.makeFloatE4M3Constant(zero ? 0.0F : (float)consts[nextConst].getDConst()));
11211
break;
11212
default:
11213
assert(0);
11214
break;
11215
}
11216
++nextConst;
11217
}
11218
} else {
11219
// we have a non-aggregate (scalar) constant
11220
bool zero = nextConst >= consts.size();
11221
spv::Id scalar = 0;
11222
switch (glslangType.getBasicType()) {
11223
case glslang::EbtInt:
11224
scalar = builder.makeIntConstant(zero ? 0 : consts[nextConst].getIConst(), specConstant);
11225
break;
11226
case glslang::EbtUint:
11227
scalar = builder.makeUintConstant(zero ? 0 : consts[nextConst].getUConst(), specConstant);
11228
break;
11229
case glslang::EbtFloat:
11230
scalar = builder.makeFloatConstant(zero ? 0.0F : (float)consts[nextConst].getDConst(), specConstant);
11231
break;
11232
case glslang::EbtBool:
11233
scalar = builder.makeBoolConstant(zero ? false : consts[nextConst].getBConst(), specConstant);
11234
break;
11235
case glslang::EbtInt8:
11236
builder.addCapability(spv::Capability::Int8);
11237
scalar = builder.makeInt8Constant(zero ? 0 : consts[nextConst].getI8Const(), specConstant);
11238
break;
11239
case glslang::EbtUint8:
11240
builder.addCapability(spv::Capability::Int8);
11241
scalar = builder.makeUint8Constant(zero ? 0 : consts[nextConst].getU8Const(), specConstant);
11242
break;
11243
case glslang::EbtInt16:
11244
builder.addCapability(spv::Capability::Int16);
11245
scalar = builder.makeInt16Constant(zero ? 0 : consts[nextConst].getI16Const(), specConstant);
11246
break;
11247
case glslang::EbtUint16:
11248
builder.addCapability(spv::Capability::Int16);
11249
scalar = builder.makeUint16Constant(zero ? 0 : consts[nextConst].getU16Const(), specConstant);
11250
break;
11251
case glslang::EbtInt64:
11252
scalar = builder.makeInt64Constant(zero ? 0 : consts[nextConst].getI64Const(), specConstant);
11253
break;
11254
case glslang::EbtUint64:
11255
scalar = builder.makeUint64Constant(zero ? 0 : consts[nextConst].getU64Const(), specConstant);
11256
break;
11257
case glslang::EbtDouble:
11258
scalar = builder.makeDoubleConstant(zero ? 0.0 : consts[nextConst].getDConst(), specConstant);
11259
break;
11260
case glslang::EbtFloat16:
11261
builder.addCapability(spv::Capability::Float16);
11262
scalar = builder.makeFloat16Constant(zero ? 0.0F : (float)consts[nextConst].getDConst(), specConstant);
11263
break;
11264
case glslang::EbtBFloat16:
11265
scalar = builder.makeBFloat16Constant(zero ? 0.0F : (float)consts[nextConst].getDConst(), specConstant);
11266
break;
11267
case glslang::EbtFloatE5M2:
11268
scalar = builder.makeFloatE5M2Constant(zero ? 0.0F : (float)consts[nextConst].getDConst(), specConstant);
11269
break;
11270
case glslang::EbtFloatE4M3:
11271
scalar = builder.makeFloatE4M3Constant(zero ? 0.0F : (float)consts[nextConst].getDConst(), specConstant);
11272
break;
11273
case glslang::EbtReference:
11274
scalar = builder.makeUint64Constant(zero ? 0 : consts[nextConst].getU64Const(), specConstant);
11275
scalar = builder.createUnaryOp(spv::Op::OpBitcast, typeId, scalar);
11276
break;
11277
case glslang::EbtString:
11278
scalar = builder.getStringId(consts[nextConst].getSConst()->c_str());
11279
break;
11280
default:
11281
assert(0);
11282
break;
11283
}
11284
++nextConst;
11285
return scalar;
11286
}
11287
11288
return builder.makeCompositeConstant(typeId, spvConsts);
11289
}
11290
11291
// Return true if the node is a constant or symbol whose reading has no
11292
// non-trivial observable cost or effect.
11293
bool TGlslangToSpvTraverser::isTrivialLeaf(const glslang::TIntermTyped* node)
11294
{
11295
// don't know what this is
11296
if (node == nullptr)
11297
return false;
11298
11299
// a constant is safe
11300
if (node->getAsConstantUnion() != nullptr)
11301
return true;
11302
11303
// not a symbol means non-trivial
11304
if (node->getAsSymbolNode() == nullptr)
11305
return false;
11306
11307
// a symbol, depends on what's being read
11308
switch (node->getType().getQualifier().storage) {
11309
case glslang::EvqTemporary:
11310
case glslang::EvqGlobal:
11311
case glslang::EvqIn:
11312
case glslang::EvqInOut:
11313
case glslang::EvqConst:
11314
case glslang::EvqConstReadOnly:
11315
case glslang::EvqUniform:
11316
return true;
11317
default:
11318
return false;
11319
}
11320
}
11321
11322
// A node is trivial if it is a single operation with no side effects.
11323
// HLSL (and/or vectors) are always trivial, as it does not short circuit.
11324
// Otherwise, error on the side of saying non-trivial.
11325
// Return true if trivial.
11326
bool TGlslangToSpvTraverser::isTrivial(const glslang::TIntermTyped* node)
11327
{
11328
if (node == nullptr)
11329
return false;
11330
11331
// count non scalars as trivial, as well as anything coming from HLSL
11332
if (! node->getType().isScalarOrVec1() || glslangIntermediate->getSource() == glslang::EShSourceHlsl)
11333
return true;
11334
11335
// symbols and constants are trivial
11336
if (isTrivialLeaf(node))
11337
return true;
11338
11339
// otherwise, it needs to be a simple operation or one or two leaf nodes
11340
11341
// not a simple operation
11342
const glslang::TIntermBinary* binaryNode = node->getAsBinaryNode();
11343
const glslang::TIntermUnary* unaryNode = node->getAsUnaryNode();
11344
if (binaryNode == nullptr && unaryNode == nullptr)
11345
return false;
11346
11347
// not on leaf nodes
11348
if (binaryNode && (! isTrivialLeaf(binaryNode->getLeft()) || ! isTrivialLeaf(binaryNode->getRight())))
11349
return false;
11350
11351
if (unaryNode && ! isTrivialLeaf(unaryNode->getOperand())) {
11352
return false;
11353
}
11354
11355
if (IsOpNumericConv(node->getAsOperator()->getOp()) &&
11356
node->getType().getBasicType() == glslang::EbtBool) {
11357
return true;
11358
}
11359
11360
switch (node->getAsOperator()->getOp()) {
11361
case glslang::EOpLogicalNot:
11362
case glslang::EOpEqual:
11363
case glslang::EOpNotEqual:
11364
case glslang::EOpLessThan:
11365
case glslang::EOpGreaterThan:
11366
case glslang::EOpLessThanEqual:
11367
case glslang::EOpGreaterThanEqual:
11368
case glslang::EOpIndexDirect:
11369
case glslang::EOpIndexDirectStruct:
11370
case glslang::EOpLogicalXor:
11371
case glslang::EOpAny:
11372
case glslang::EOpAll:
11373
return true;
11374
default:
11375
return false;
11376
}
11377
}
11378
11379
// Emit short-circuiting code, where 'right' is never evaluated unless
11380
// the left side is true (for &&) or false (for ||).
11381
spv::Id TGlslangToSpvTraverser::createShortCircuit(glslang::TOperator op, glslang::TIntermTyped& left,
11382
glslang::TIntermTyped& right)
11383
{
11384
spv::Id boolTypeId = builder.makeBoolType();
11385
11386
// emit left operand
11387
builder.clearAccessChain();
11388
left.traverse(this);
11389
spv::Id leftId = accessChainLoad(left.getType());
11390
11391
// Operands to accumulate OpPhi operands
11392
std::vector<spv::Id> phiOperands;
11393
phiOperands.reserve(4);
11394
// accumulate left operand's phi information
11395
phiOperands.push_back(leftId);
11396
phiOperands.push_back(builder.getBuildPoint()->getId());
11397
11398
// Make the two kinds of operation symmetric with a "!"
11399
// || => emit "if (! left) result = right"
11400
// && => emit "if ( left) result = right"
11401
//
11402
// TODO: this runtime "not" for || could be avoided by adding functionality
11403
// to 'builder' to have an "else" without an "then"
11404
if (op == glslang::EOpLogicalOr)
11405
leftId = builder.createUnaryOp(spv::Op::OpLogicalNot, boolTypeId, leftId);
11406
11407
// make an "if" based on the left value
11408
spv::Builder::If ifBuilder(leftId, spv::SelectionControlMask::MaskNone, builder);
11409
11410
// emit right operand as the "then" part of the "if"
11411
builder.clearAccessChain();
11412
right.traverse(this);
11413
spv::Id rightId = accessChainLoad(right.getType());
11414
11415
// accumulate left operand's phi information
11416
phiOperands.push_back(rightId);
11417
phiOperands.push_back(builder.getBuildPoint()->getId());
11418
11419
// finish the "if"
11420
ifBuilder.makeEndIf();
11421
11422
// phi together the two results
11423
return builder.createOp(spv::Op::OpPhi, boolTypeId, phiOperands);
11424
}
11425
11426
// Return type Id of the imported set of extended instructions corresponds to the name.
11427
// Import this set if it has not been imported yet.
11428
spv::Id TGlslangToSpvTraverser::getExtBuiltins(const char* name)
11429
{
11430
if (extBuiltinMap.find(name) != extBuiltinMap.end())
11431
return extBuiltinMap[name];
11432
else {
11433
spv::Id extBuiltins = builder.import(name);
11434
extBuiltinMap[name] = extBuiltins;
11435
return extBuiltins;
11436
}
11437
}
11438
11439
} // end anonymous namespace
11440
11441
namespace glslang {
11442
11443
void GetSpirvVersion(std::string& version)
11444
{
11445
const int bufSize = 100;
11446
char buf[bufSize];
11447
snprintf(buf, bufSize, "0x%08x, Revision %d", spv::Version, spv::Revision);
11448
version = buf;
11449
}
11450
11451
// For low-order part of the generator's magic number. Bump up
// when there is a change in the style (e.g., if SSA form changes,
// or a different instruction sequence to do something gets used).
int GetSpirvGeneratorVersion()
{
    // History of earlier values:
    //  1: start
    //  2: EOpAtomicCounterDecrement gets a post decrement, to map between GLSL -> SPIR-V
    //  3: change/correct barrier-instruction operands, to match memory model group decisions
    //  4: some deeper access chains: for dynamic vector component, and local Boolean component
    //  5: make OpArrayLength result type be an int with signedness of 0
    //  6: revert version 5 change, which makes a different (new) kind of incorrect code,
    //     versions 4 and 6 each generate OpArrayLength as it has long been done
    //  7: GLSL volatile keyword maps to both SPIR-V decorations Volatile and Coherent
    //  8: switch to new dead block eliminator; use OpUnreachable
    //  9: don't include opaque function parameters in OpEntryPoint global's operand list
    // 10: Generate OpFUnordNotEqual for != comparisons
    const int currentVersion = 11; // Make OpEmitMeshTasksEXT a terminal instruction
    return currentVersion;
}
11469
11470
// Write SPIR-V out to a binary file: the raw bytes of each word, four bytes
// per word, in the order the words appear in 'spirv'.
//
// Returns false, after printing an error, if 'baseName' cannot be opened or if
// writing/flushing the data fails; returns true once everything was written.
bool OutputSpvBin(const std::vector<unsigned int>& spirv, const char* baseName)
{
    std::ofstream out;
    out.open(baseName, std::ios::binary | std::ios::out);
    if (out.fail()) {
        printf("ERROR: Failed to open file: %s\n", baseName);
        return false;
    }

    const std::streamsize bytesPerWord = 4;
    for (const unsigned int word : spirv)
        out.write(reinterpret_cast<const char*>(&word), bytesPerWord);

    // close() flushes the buffered data; a failed write or flush leaves the
    // stream in a failed state, which must not be reported as success.
    out.close();
    if (out.fail()) {
        printf("ERROR: Failed to write file: %s\n", baseName);
        return false;
    }

    return true;
}
11486
11487
// Write SPIR-V out to a text file with 32-bit hexadecimal words
11488
bool OutputSpvHex(const std::vector<unsigned int>& spirv, const char* baseName, const char* varName)
11489
{
11490
std::ofstream out;
11491
out.open(baseName, std::ios::binary | std::ios::out);
11492
if (out.fail()) {
11493
printf("ERROR: Failed to open file: %s\n", baseName);
11494
return false;
11495
}
11496
out << "\t// " <<
11497
GetSpirvGeneratorVersion() <<
11498
GLSLANG_VERSION_MAJOR << "." << GLSLANG_VERSION_MINOR << "." << GLSLANG_VERSION_PATCH <<
11499
GLSLANG_VERSION_FLAVOR << std::endl;
11500
if (varName != nullptr) {
11501
out << "\t #pragma once" << std::endl;
11502
out << "const uint32_t " << varName << "[] = {" << std::endl;
11503
}
11504
const int WORDS_PER_LINE = 8;
11505
for (int i = 0; i < (int)spirv.size(); i += WORDS_PER_LINE) {
11506
out << "\t";
11507
for (int j = 0; j < WORDS_PER_LINE && i + j < (int)spirv.size(); ++j) {
11508
const unsigned int word = spirv[i + j];
11509
out << "0x" << std::hex << std::setw(8) << std::setfill('0') << word;
11510
if (i + j + 1 < (int)spirv.size()) {
11511
out << ",";
11512
}
11513
}
11514
out << std::endl;
11515
}
11516
if (varName != nullptr) {
11517
out << "};";
11518
out << std::endl;
11519
}
11520
out.close();
11521
return true;
11522
}
11523
11524
//
11525
// Set up the glslang traversal
11526
//
11527
void GlslangToSpv(const TIntermediate& intermediate, std::vector<unsigned int>& spirv, SpvOptions* options)
11528
{
11529
spv::SpvBuildLogger logger;
11530
GlslangToSpv(intermediate, spirv, &logger, options);
11531
}
11532
11533
void GlslangToSpv(const TIntermediate& intermediate, std::vector<unsigned int>& spirv,
11534
spv::SpvBuildLogger* logger, SpvOptions* options)
11535
{
11536
TIntermNode* root = intermediate.getTreeRoot();
11537
11538
if (root == nullptr)
11539
return;
11540
11541
SpvOptions defaultOptions;
11542
if (options == nullptr)
11543
options = &defaultOptions;
11544
11545
GetThreadPoolAllocator().push();
11546
11547
TGlslangToSpvTraverser it(intermediate.getSpv().spv, &intermediate, logger, *options);
11548
root->traverse(&it);
11549
it.finishSpv(options->compileOnly);
11550
it.dumpSpv(spirv);
11551
11552
#if ENABLE_OPT
11553
// If from HLSL, run spirv-opt to "legalize" the SPIR-V for Vulkan
11554
// eg. forward and remove memory writes of opaque types.
11555
bool prelegalization = intermediate.getSource() == EShSourceHlsl;
11556
if ((prelegalization || options->optimizeSize) && !options->disableOptimizer) {
11557
SpirvToolsTransform(intermediate, spirv, logger, options);
11558
prelegalization = false;
11559
}
11560
else if (options->stripDebugInfo) {
11561
// Strip debug info even if optimization is disabled.
11562
SpirvToolsStripDebugInfo(intermediate, spirv, logger);
11563
}
11564
11565
if (options->validate)
11566
SpirvToolsValidate(intermediate, spirv, logger, prelegalization);
11567
11568
if (options->disassemble)
11569
SpirvToolsDisassemble(std::cout, spirv);
11570
11571
#endif
11572
11573
GetThreadPoolAllocator().pop();
11574
}
11575
11576
} // end namespace glslang
11577
11578