Book a Demo!
CoCalc Logo Icon
StoreFeaturesDocsShareSupportNewsAboutPoliciesSign UpSign In
freebsd
GitHub Repository: freebsd/freebsd-src
Path: blob/main/contrib/llvm-project/llvm/lib/Target/NVPTX/NVPTXSubtarget.h
35271 views
1
//=====-- NVPTXSubtarget.h - Define Subtarget for the NVPTX ---*- C++ -*--====//
2
//
3
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4
// See https://llvm.org/LICENSE.txt for license information.
5
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6
//
7
//===----------------------------------------------------------------------===//
8
//
9
// This file declares the NVPTX specific subclass of TargetSubtarget.
10
//
11
//===----------------------------------------------------------------------===//
12
13
#ifndef LLVM_LIB_TARGET_NVPTX_NVPTXSUBTARGET_H
14
#define LLVM_LIB_TARGET_NVPTX_NVPTXSUBTARGET_H
15
16
#include "NVPTX.h"
17
#include "NVPTXFrameLowering.h"
18
#include "NVPTXISelLowering.h"
19
#include "NVPTXInstrInfo.h"
20
#include "NVPTXRegisterInfo.h"
21
#include "llvm/CodeGen/SelectionDAGTargetInfo.h"
22
#include "llvm/CodeGen/TargetSubtargetInfo.h"
23
#include "llvm/IR/DataLayout.h"
24
#include <string>
25
26
#define GET_SUBTARGETINFO_HEADER
27
#include "NVPTXGenSubtargetInfo.inc"
28
29
namespace llvm {
30
31
class NVPTXSubtarget : public NVPTXGenSubtargetInfo {
32
virtual void anchor();
33
std::string TargetName;
34
35
// PTX version x.y is represented as 10*x+y, e.g. 3.1 == 31
36
unsigned PTXVersion;
37
38
// Full SM version x.y is represented as 100*x+10*y+feature, e.g. 3.1 == 310
39
// sm_90a == 901
40
unsigned int FullSmVersion;
41
42
// SM version x.y is represented as 10*x+y, e.g. 3.1 == 31. Derived from
43
// FullSmVersion.
44
unsigned int SmVersion;
45
46
const NVPTXTargetMachine &TM;
47
NVPTXInstrInfo InstrInfo;
48
NVPTXTargetLowering TLInfo;
49
SelectionDAGTargetInfo TSInfo;
50
51
// NVPTX does not have any call stack frame, but need a NVPTX specific
52
// FrameLowering class because TargetFrameLowering is abstract.
53
NVPTXFrameLowering FrameLowering;
54
55
public:
56
/// This constructor initializes the data members to match that
57
/// of the specified module.
58
///
59
NVPTXSubtarget(const Triple &TT, const std::string &CPU,
60
const std::string &FS, const NVPTXTargetMachine &TM);
61
62
const TargetFrameLowering *getFrameLowering() const override {
63
return &FrameLowering;
64
}
65
const NVPTXInstrInfo *getInstrInfo() const override { return &InstrInfo; }
66
const NVPTXRegisterInfo *getRegisterInfo() const override {
67
return &InstrInfo.getRegisterInfo();
68
}
69
const NVPTXTargetLowering *getTargetLowering() const override {
70
return &TLInfo;
71
}
72
const SelectionDAGTargetInfo *getSelectionDAGInfo() const override {
73
return &TSInfo;
74
}
75
76
bool hasAtomAddF64() const { return SmVersion >= 60; }
77
bool hasAtomScope() const { return SmVersion >= 60; }
78
bool hasAtomBitwise64() const { return SmVersion >= 32; }
79
bool hasAtomMinMax64() const { return SmVersion >= 32; }
80
bool hasLDG() const { return SmVersion >= 32; }
81
inline bool hasHWROT32() const { return SmVersion >= 32; }
82
bool hasImageHandles() const;
83
bool hasFP16Math() const { return SmVersion >= 53; }
84
bool hasBF16Math() const { return SmVersion >= 80; }
85
bool allowFP16Math() const;
86
bool hasMaskOperator() const { return PTXVersion >= 71; }
87
bool hasNoReturn() const { return SmVersion >= 30 && PTXVersion >= 64; }
88
unsigned int getFullSmVersion() const { return FullSmVersion; }
89
unsigned int getSmVersion() const { return getFullSmVersion() / 10; }
90
// GPUs with "a" suffix have include architecture-accelerated features that
91
// are supported on the specified architecture only, hence such targets do not
92
// follow the onion layer model. hasAAFeatures() allows distinguishing such
93
// GPU variants from the base GPU architecture.
94
// - 0 represents base GPU model,
95
// - non-zero value identifies particular architecture-accelerated variant.
96
bool hasAAFeatures() const { return getFullSmVersion() % 10; }
97
std::string getTargetName() const { return TargetName; }
98
99
// Get maximum value of required alignments among the supported data types.
100
// From the PTX ISA doc, section 8.2.3:
101
// The memory consistency model relates operations executed on memory
102
// locations with scalar data-types, which have a maximum size and alignment
103
// of 64 bits. Memory operations with a vector data-type are modelled as a
104
// set of equivalent memory operations with a scalar data-type, executed in
105
// an unspecified order on the elements in the vector.
106
unsigned getMaxRequiredAlignment() const { return 8; }
107
108
unsigned getPTXVersion() const { return PTXVersion; }
109
110
NVPTXSubtarget &initializeSubtargetDependencies(StringRef CPU, StringRef FS);
111
void ParseSubtargetFeatures(StringRef CPU, StringRef TuneCPU, StringRef FS);
112
};
113
114
} // End llvm namespace
115
116
#endif
117
118