// Path: blob/main/contrib/llvm-project/llvm/lib/TargetParser/TargetParser.cpp
// 35234 views
//===-- TargetParser - Parser for target features ---------------*- C++ -*-===//1//2// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.3// See https://llvm.org/LICENSE.txt for license information.4// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception5//6//===----------------------------------------------------------------------===//7//8// This file implements a target parser to recognise hardware features such as9// FPU/CPU/ARCH names as well as specific support such as HDIV, etc.10//11//===----------------------------------------------------------------------===//1213#include "llvm/TargetParser/TargetParser.h"14#include "llvm/ADT/ArrayRef.h"15#include "llvm/TargetParser/Triple.h"1617using namespace llvm;18using namespace AMDGPU;1920namespace {2122struct GPUInfo {23StringLiteral Name;24StringLiteral CanonicalName;25AMDGPU::GPUKind Kind;26unsigned Features;27};2829constexpr GPUInfo R600GPUs[] = {30// Name Canonical Kind Features31// Name32{{"r600"}, {"r600"}, GK_R600, FEATURE_NONE },33{{"rv630"}, {"r600"}, GK_R600, FEATURE_NONE },34{{"rv635"}, {"r600"}, GK_R600, FEATURE_NONE },35{{"r630"}, {"r630"}, GK_R630, FEATURE_NONE },36{{"rs780"}, {"rs880"}, GK_RS880, FEATURE_NONE },37{{"rs880"}, {"rs880"}, GK_RS880, FEATURE_NONE },38{{"rv610"}, {"rs880"}, GK_RS880, FEATURE_NONE },39{{"rv620"}, {"rs880"}, GK_RS880, FEATURE_NONE },40{{"rv670"}, {"rv670"}, GK_RV670, FEATURE_NONE },41{{"rv710"}, {"rv710"}, GK_RV710, FEATURE_NONE },42{{"rv730"}, {"rv730"}, GK_RV730, FEATURE_NONE },43{{"rv740"}, {"rv770"}, GK_RV770, FEATURE_NONE },44{{"rv770"}, {"rv770"}, GK_RV770, FEATURE_NONE },45{{"cedar"}, {"cedar"}, GK_CEDAR, FEATURE_NONE },46{{"palm"}, {"cedar"}, GK_CEDAR, FEATURE_NONE },47{{"cypress"}, {"cypress"}, GK_CYPRESS, FEATURE_FMA },48{{"hemlock"}, {"cypress"}, GK_CYPRESS, FEATURE_FMA },49{{"juniper"}, {"juniper"}, GK_JUNIPER, FEATURE_NONE },50{{"redwood"}, {"redwood"}, GK_REDWOOD, FEATURE_NONE },51{{"sumo"}, {"sumo"}, GK_SUMO, FEATURE_NONE 
},52{{"sumo2"}, {"sumo"}, GK_SUMO, FEATURE_NONE },53{{"barts"}, {"barts"}, GK_BARTS, FEATURE_NONE },54{{"caicos"}, {"caicos"}, GK_CAICOS, FEATURE_NONE },55{{"aruba"}, {"cayman"}, GK_CAYMAN, FEATURE_FMA },56{{"cayman"}, {"cayman"}, GK_CAYMAN, FEATURE_FMA },57{{"turks"}, {"turks"}, GK_TURKS, FEATURE_NONE }58};5960// This table should be sorted by the value of GPUKind61// Don't bother listing the implicitly true features62constexpr GPUInfo AMDGCNGPUs[] = {63// clang-format off64// Name Canonical Kind Features65// Name66{{"gfx600"}, {"gfx600"}, GK_GFX600, FEATURE_FAST_FMA_F32},67{{"tahiti"}, {"gfx600"}, GK_GFX600, FEATURE_FAST_FMA_F32},68{{"gfx601"}, {"gfx601"}, GK_GFX601, FEATURE_NONE},69{{"pitcairn"}, {"gfx601"}, GK_GFX601, FEATURE_NONE},70{{"verde"}, {"gfx601"}, GK_GFX601, FEATURE_NONE},71{{"gfx602"}, {"gfx602"}, GK_GFX602, FEATURE_NONE},72{{"hainan"}, {"gfx602"}, GK_GFX602, FEATURE_NONE},73{{"oland"}, {"gfx602"}, GK_GFX602, FEATURE_NONE},74{{"gfx700"}, {"gfx700"}, GK_GFX700, FEATURE_NONE},75{{"kaveri"}, {"gfx700"}, GK_GFX700, FEATURE_NONE},76{{"gfx701"}, {"gfx701"}, GK_GFX701, FEATURE_FAST_FMA_F32},77{{"hawaii"}, {"gfx701"}, GK_GFX701, FEATURE_FAST_FMA_F32},78{{"gfx702"}, {"gfx702"}, GK_GFX702, FEATURE_FAST_FMA_F32},79{{"gfx703"}, {"gfx703"}, GK_GFX703, FEATURE_NONE},80{{"kabini"}, {"gfx703"}, GK_GFX703, FEATURE_NONE},81{{"mullins"}, {"gfx703"}, GK_GFX703, FEATURE_NONE},82{{"gfx704"}, {"gfx704"}, GK_GFX704, FEATURE_NONE},83{{"bonaire"}, {"gfx704"}, GK_GFX704, FEATURE_NONE},84{{"gfx705"}, {"gfx705"}, GK_GFX705, FEATURE_NONE},85{{"gfx801"}, {"gfx801"}, GK_GFX801, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},86{{"carrizo"}, {"gfx801"}, GK_GFX801, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},87{{"gfx802"}, {"gfx802"}, GK_GFX802, FEATURE_FAST_DENORMAL_F32},88{{"iceland"}, {"gfx802"}, GK_GFX802, FEATURE_FAST_DENORMAL_F32},89{{"tonga"}, {"gfx802"}, GK_GFX802, FEATURE_FAST_DENORMAL_F32},90{{"gfx803"}, {"gfx803"}, GK_GFX803, 
FEATURE_FAST_DENORMAL_F32},91{{"fiji"}, {"gfx803"}, GK_GFX803, FEATURE_FAST_DENORMAL_F32},92{{"polaris10"}, {"gfx803"}, GK_GFX803, FEATURE_FAST_DENORMAL_F32},93{{"polaris11"}, {"gfx803"}, GK_GFX803, FEATURE_FAST_DENORMAL_F32},94{{"gfx805"}, {"gfx805"}, GK_GFX805, FEATURE_FAST_DENORMAL_F32},95{{"tongapro"}, {"gfx805"}, GK_GFX805, FEATURE_FAST_DENORMAL_F32},96{{"gfx810"}, {"gfx810"}, GK_GFX810, FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},97{{"stoney"}, {"gfx810"}, GK_GFX810, FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},98{{"gfx900"}, {"gfx900"}, GK_GFX900, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},99{{"gfx902"}, {"gfx902"}, GK_GFX902, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},100{{"gfx904"}, {"gfx904"}, GK_GFX904, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},101{{"gfx906"}, {"gfx906"}, GK_GFX906, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK|FEATURE_SRAMECC},102{{"gfx908"}, {"gfx908"}, GK_GFX908, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK|FEATURE_SRAMECC},103{{"gfx909"}, {"gfx909"}, GK_GFX909, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},104{{"gfx90a"}, {"gfx90a"}, GK_GFX90A, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK|FEATURE_SRAMECC},105{{"gfx90c"}, {"gfx90c"}, GK_GFX90C, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},106{{"gfx940"}, {"gfx940"}, GK_GFX940, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK|FEATURE_SRAMECC},107{{"gfx941"}, {"gfx941"}, GK_GFX941, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK|FEATURE_SRAMECC},108{{"gfx942"}, {"gfx942"}, GK_GFX942, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK|FEATURE_SRAMECC},109{{"gfx1010"}, {"gfx1010"}, GK_GFX1010, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_XNACK|FEATURE_WGP},110{{"gfx1011"}, {"gfx1011"}, GK_GFX1011, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_XNACK|FEATURE_WGP},111{{"gfx1012"}, 
{"gfx1012"}, GK_GFX1012, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_XNACK|FEATURE_WGP},112{{"gfx1013"}, {"gfx1013"}, GK_GFX1013, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_XNACK|FEATURE_WGP},113{{"gfx1030"}, {"gfx1030"}, GK_GFX1030, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},114{{"gfx1031"}, {"gfx1031"}, GK_GFX1031, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},115{{"gfx1032"}, {"gfx1032"}, GK_GFX1032, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},116{{"gfx1033"}, {"gfx1033"}, GK_GFX1033, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},117{{"gfx1034"}, {"gfx1034"}, GK_GFX1034, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},118{{"gfx1035"}, {"gfx1035"}, GK_GFX1035, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},119{{"gfx1036"}, {"gfx1036"}, GK_GFX1036, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},120{{"gfx1100"}, {"gfx1100"}, GK_GFX1100, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},121{{"gfx1101"}, {"gfx1101"}, GK_GFX1101, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},122{{"gfx1102"}, {"gfx1102"}, GK_GFX1102, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},123{{"gfx1103"}, {"gfx1103"}, GK_GFX1103, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},124{{"gfx1150"}, {"gfx1150"}, GK_GFX1150, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},125{{"gfx1151"}, {"gfx1151"}, GK_GFX1151, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},126{{"gfx1152"}, {"gfx1152"}, GK_GFX1152, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},127{{"gfx1200"}, {"gfx1200"}, GK_GFX1200, 
FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},128{{"gfx1201"}, {"gfx1201"}, GK_GFX1201, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},129130{{"gfx9-generic"}, {"gfx9-generic"}, GK_GFX9_GENERIC, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},131{{"gfx10-1-generic"}, {"gfx10-1-generic"}, GK_GFX10_1_GENERIC, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_XNACK|FEATURE_WGP},132{{"gfx10-3-generic"}, {"gfx10-3-generic"}, GK_GFX10_3_GENERIC, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},133{{"gfx11-generic"}, {"gfx11-generic"}, GK_GFX11_GENERIC, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},134{{"gfx12-generic"}, {"gfx12-generic"}, GK_GFX12_GENERIC, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},135// clang-format on136};137138const GPUInfo *getArchEntry(AMDGPU::GPUKind AK, ArrayRef<GPUInfo> Table) {139GPUInfo Search = { {""}, {""}, AK, AMDGPU::FEATURE_NONE };140141auto I =142llvm::lower_bound(Table, Search, [](const GPUInfo &A, const GPUInfo &B) {143return A.Kind < B.Kind;144});145146if (I == Table.end() || I->Kind != Search.Kind)147return nullptr;148return I;149}150151} // namespace152153StringRef llvm::AMDGPU::getArchFamilyNameAMDGCN(GPUKind AK) {154switch (AK) {155case AMDGPU::GK_GFX9_GENERIC:156return "gfx9";157case AMDGPU::GK_GFX10_1_GENERIC:158case AMDGPU::GK_GFX10_3_GENERIC:159return "gfx10";160case AMDGPU::GK_GFX11_GENERIC:161return "gfx11";162case AMDGPU::GK_GFX12_GENERIC:163return "gfx12";164default: {165StringRef ArchName = getArchNameAMDGCN(AK);166return ArchName.empty() ? 
"" : ArchName.drop_back(2);167}168}169}170171StringRef llvm::AMDGPU::getArchNameAMDGCN(GPUKind AK) {172if (const auto *Entry = getArchEntry(AK, AMDGCNGPUs))173return Entry->CanonicalName;174return "";175}176177StringRef llvm::AMDGPU::getArchNameR600(GPUKind AK) {178if (const auto *Entry = getArchEntry(AK, R600GPUs))179return Entry->CanonicalName;180return "";181}182183AMDGPU::GPUKind llvm::AMDGPU::parseArchAMDGCN(StringRef CPU) {184for (const auto &C : AMDGCNGPUs) {185if (CPU == C.Name)186return C.Kind;187}188189return AMDGPU::GPUKind::GK_NONE;190}191192AMDGPU::GPUKind llvm::AMDGPU::parseArchR600(StringRef CPU) {193for (const auto &C : R600GPUs) {194if (CPU == C.Name)195return C.Kind;196}197198return AMDGPU::GPUKind::GK_NONE;199}200201unsigned AMDGPU::getArchAttrAMDGCN(GPUKind AK) {202if (const auto *Entry = getArchEntry(AK, AMDGCNGPUs))203return Entry->Features;204return FEATURE_NONE;205}206207unsigned AMDGPU::getArchAttrR600(GPUKind AK) {208if (const auto *Entry = getArchEntry(AK, R600GPUs))209return Entry->Features;210return FEATURE_NONE;211}212213void AMDGPU::fillValidArchListAMDGCN(SmallVectorImpl<StringRef> &Values) {214// XXX: Should this only report unique canonical names?215for (const auto &C : AMDGCNGPUs)216Values.push_back(C.Name);217}218219void AMDGPU::fillValidArchListR600(SmallVectorImpl<StringRef> &Values) {220for (const auto &C : R600GPUs)221Values.push_back(C.Name);222}223224AMDGPU::IsaVersion AMDGPU::getIsaVersion(StringRef GPU) {225AMDGPU::GPUKind AK = parseArchAMDGCN(GPU);226if (AK == AMDGPU::GPUKind::GK_NONE) {227if (GPU == "generic-hsa")228return {7, 0, 0};229if (GPU == "generic")230return {6, 0, 0};231return {0, 0, 0};232}233234// clang-format off235switch (AK) {236case GK_GFX600: return {6, 0, 0};237case GK_GFX601: return {6, 0, 1};238case GK_GFX602: return {6, 0, 2};239case GK_GFX700: return {7, 0, 0};240case GK_GFX701: return {7, 0, 1};241case GK_GFX702: return {7, 0, 2};242case GK_GFX703: return {7, 0, 3};243case GK_GFX704: return {7, 0, 
4};244case GK_GFX705: return {7, 0, 5};245case GK_GFX801: return {8, 0, 1};246case GK_GFX802: return {8, 0, 2};247case GK_GFX803: return {8, 0, 3};248case GK_GFX805: return {8, 0, 5};249case GK_GFX810: return {8, 1, 0};250case GK_GFX900: return {9, 0, 0};251case GK_GFX902: return {9, 0, 2};252case GK_GFX904: return {9, 0, 4};253case GK_GFX906: return {9, 0, 6};254case GK_GFX908: return {9, 0, 8};255case GK_GFX909: return {9, 0, 9};256case GK_GFX90A: return {9, 0, 10};257case GK_GFX90C: return {9, 0, 12};258case GK_GFX940: return {9, 4, 0};259case GK_GFX941: return {9, 4, 1};260case GK_GFX942: return {9, 4, 2};261case GK_GFX1010: return {10, 1, 0};262case GK_GFX1011: return {10, 1, 1};263case GK_GFX1012: return {10, 1, 2};264case GK_GFX1013: return {10, 1, 3};265case GK_GFX1030: return {10, 3, 0};266case GK_GFX1031: return {10, 3, 1};267case GK_GFX1032: return {10, 3, 2};268case GK_GFX1033: return {10, 3, 3};269case GK_GFX1034: return {10, 3, 4};270case GK_GFX1035: return {10, 3, 5};271case GK_GFX1036: return {10, 3, 6};272case GK_GFX1100: return {11, 0, 0};273case GK_GFX1101: return {11, 0, 1};274case GK_GFX1102: return {11, 0, 2};275case GK_GFX1103: return {11, 0, 3};276case GK_GFX1150: return {11, 5, 0};277case GK_GFX1151: return {11, 5, 1};278case GK_GFX1152: return {11, 5, 2};279case GK_GFX1200: return {12, 0, 0};280case GK_GFX1201: return {12, 0, 1};281282// Generic targets return the lowest common denominator283// within their family. 
That is, the ISA that is the most284// restricted in terms of features.285//286// gfx9-generic is tricky because there is no lowest287// common denominator, so we return gfx900 which has mad-mix288// but this family doesn't have it.289//290// This API should never be used to check for a particular291// feature anyway.292//293// TODO: Split up this API depending on its caller so294// generic target handling is more obvious and less risky.295case GK_GFX9_GENERIC: return {9, 0, 0};296case GK_GFX10_1_GENERIC: return {10, 1, 0};297case GK_GFX10_3_GENERIC: return {10, 3, 0};298case GK_GFX11_GENERIC: return {11, 0, 3};299case GK_GFX12_GENERIC: return {12, 0, 0};300default: return {0, 0, 0};301}302// clang-format on303}304305StringRef AMDGPU::getCanonicalArchName(const Triple &T, StringRef Arch) {306assert(T.isAMDGPU());307auto ProcKind = T.isAMDGCN() ? parseArchAMDGCN(Arch) : parseArchR600(Arch);308if (ProcKind == GK_NONE)309return StringRef();310311return T.isAMDGCN() ? getArchNameAMDGCN(ProcKind) : getArchNameR600(ProcKind);312}313314void AMDGPU::fillAMDGPUFeatureMap(StringRef GPU, const Triple &T,315StringMap<bool> &Features) {316// XXX - What does the member GPU mean if device name string passed here?317if (T.isSPIRV() && T.getOS() == Triple::OSType::AMDHSA) {318// AMDGCN SPIRV must support the union of all AMDGCN features.319Features["atomic-ds-pk-add-16-insts"] = true;320Features["atomic-flat-pk-add-16-insts"] = true;321Features["atomic-buffer-global-pk-add-f16-insts"] = true;322Features["atomic-global-pk-add-bf16-inst"] = true;323Features["atomic-fadd-rtn-insts"] = true;324Features["ci-insts"] = true;325Features["dot1-insts"] = true;326Features["dot2-insts"] = true;327Features["dot3-insts"] = true;328Features["dot4-insts"] = true;329Features["dot5-insts"] = true;330Features["dot7-insts"] = true;331Features["dot8-insts"] = true;332Features["dot9-insts"] = true;333Features["dot10-insts"] = true;334Features["dot11-insts"] = true;335Features["dl-insts"] = 
true;336Features["16-bit-insts"] = true;337Features["dpp"] = true;338Features["gfx8-insts"] = true;339Features["gfx9-insts"] = true;340Features["gfx90a-insts"] = true;341Features["gfx940-insts"] = true;342Features["gfx10-insts"] = true;343Features["gfx10-3-insts"] = true;344Features["gfx11-insts"] = true;345Features["gfx12-insts"] = true;346Features["image-insts"] = true;347Features["fp8-conversion-insts"] = true;348Features["s-memrealtime"] = true;349Features["s-memtime-inst"] = true;350Features["gws"] = true;351Features["fp8-insts"] = true;352Features["fp8-conversion-insts"] = true;353Features["atomic-ds-pk-add-16-insts"] = true;354Features["mai-insts"] = true;355Features["wavefrontsize32"] = true;356Features["wavefrontsize64"] = true;357} else if (T.isAMDGCN()) {358switch (parseArchAMDGCN(GPU)) {359case GK_GFX1201:360case GK_GFX1200:361case GK_GFX12_GENERIC:362Features["ci-insts"] = true;363Features["dot7-insts"] = true;364Features["dot8-insts"] = true;365Features["dot9-insts"] = true;366Features["dot10-insts"] = true;367Features["dot11-insts"] = true;368Features["dl-insts"] = true;369Features["atomic-ds-pk-add-16-insts"] = true;370Features["atomic-flat-pk-add-16-insts"] = true;371Features["atomic-buffer-global-pk-add-f16-insts"] = true;372Features["atomic-global-pk-add-bf16-inst"] = true;373Features["16-bit-insts"] = true;374Features["dpp"] = true;375Features["gfx8-insts"] = true;376Features["gfx9-insts"] = true;377Features["gfx10-insts"] = true;378Features["gfx10-3-insts"] = true;379Features["gfx11-insts"] = true;380Features["gfx12-insts"] = true;381Features["atomic-fadd-rtn-insts"] = true;382Features["image-insts"] = true;383Features["fp8-conversion-insts"] = true;384break;385case GK_GFX1152:386case GK_GFX1151:387case GK_GFX1150:388case GK_GFX1103:389case GK_GFX1102:390case GK_GFX1101:391case GK_GFX1100:392case GK_GFX11_GENERIC:393Features["ci-insts"] = true;394Features["dot5-insts"] = true;395Features["dot7-insts"] = true;396Features["dot8-insts"] = 
true;397Features["dot9-insts"] = true;398Features["dot10-insts"] = true;399Features["dl-insts"] = true;400Features["16-bit-insts"] = true;401Features["dpp"] = true;402Features["gfx8-insts"] = true;403Features["gfx9-insts"] = true;404Features["gfx10-insts"] = true;405Features["gfx10-3-insts"] = true;406Features["gfx11-insts"] = true;407Features["atomic-fadd-rtn-insts"] = true;408Features["image-insts"] = true;409Features["gws"] = true;410break;411case GK_GFX1036:412case GK_GFX1035:413case GK_GFX1034:414case GK_GFX1033:415case GK_GFX1032:416case GK_GFX1031:417case GK_GFX1030:418case GK_GFX10_3_GENERIC:419Features["ci-insts"] = true;420Features["dot1-insts"] = true;421Features["dot2-insts"] = true;422Features["dot5-insts"] = true;423Features["dot6-insts"] = true;424Features["dot7-insts"] = true;425Features["dot10-insts"] = true;426Features["dl-insts"] = true;427Features["16-bit-insts"] = true;428Features["dpp"] = true;429Features["gfx8-insts"] = true;430Features["gfx9-insts"] = true;431Features["gfx10-insts"] = true;432Features["gfx10-3-insts"] = true;433Features["image-insts"] = true;434Features["s-memrealtime"] = true;435Features["s-memtime-inst"] = true;436Features["gws"] = true;437break;438case GK_GFX1012:439case GK_GFX1011:440Features["dot1-insts"] = true;441Features["dot2-insts"] = true;442Features["dot5-insts"] = true;443Features["dot6-insts"] = true;444Features["dot7-insts"] = true;445Features["dot10-insts"] = true;446[[fallthrough]];447case GK_GFX1013:448case GK_GFX1010:449case GK_GFX10_1_GENERIC:450Features["dl-insts"] = true;451Features["ci-insts"] = true;452Features["16-bit-insts"] = true;453Features["dpp"] = true;454Features["gfx8-insts"] = true;455Features["gfx9-insts"] = true;456Features["gfx10-insts"] = true;457Features["image-insts"] = true;458Features["s-memrealtime"] = true;459Features["s-memtime-inst"] = true;460Features["gws"] = true;461break;462case GK_GFX942:463case GK_GFX941:464case GK_GFX940:465Features["gfx940-insts"] = 
true;466Features["fp8-insts"] = true;467Features["fp8-conversion-insts"] = true;468Features["atomic-ds-pk-add-16-insts"] = true;469Features["atomic-flat-pk-add-16-insts"] = true;470Features["atomic-global-pk-add-bf16-inst"] = true;471Features["gfx90a-insts"] = true;472Features["atomic-buffer-global-pk-add-f16-insts"] = true;473Features["atomic-fadd-rtn-insts"] = true;474Features["dot3-insts"] = true;475Features["dot4-insts"] = true;476Features["dot5-insts"] = true;477Features["dot6-insts"] = true;478Features["mai-insts"] = true;479Features["dl-insts"] = true;480Features["dot1-insts"] = true;481Features["dot2-insts"] = true;482Features["dot7-insts"] = true;483Features["dot10-insts"] = true;484Features["gfx9-insts"] = true;485Features["gfx8-insts"] = true;486Features["16-bit-insts"] = true;487Features["dpp"] = true;488Features["s-memrealtime"] = true;489Features["ci-insts"] = true;490Features["s-memtime-inst"] = true;491Features["gws"] = true;492break;493case GK_GFX90A:494Features["gfx90a-insts"] = true;495Features["atomic-buffer-global-pk-add-f16-insts"] = true;496Features["atomic-fadd-rtn-insts"] = true;497[[fallthrough]];498case GK_GFX908:499Features["dot3-insts"] = true;500Features["dot4-insts"] = true;501Features["dot5-insts"] = true;502Features["dot6-insts"] = true;503Features["mai-insts"] = true;504[[fallthrough]];505case GK_GFX906:506Features["dl-insts"] = true;507Features["dot1-insts"] = true;508Features["dot2-insts"] = true;509Features["dot7-insts"] = true;510Features["dot10-insts"] = true;511[[fallthrough]];512case GK_GFX90C:513case GK_GFX909:514case GK_GFX904:515case GK_GFX902:516case GK_GFX900:517case GK_GFX9_GENERIC:518Features["gfx9-insts"] = true;519[[fallthrough]];520case GK_GFX810:521case GK_GFX805:522case GK_GFX803:523case GK_GFX802:524case GK_GFX801:525Features["gfx8-insts"] = true;526Features["16-bit-insts"] = true;527Features["dpp"] = true;528Features["s-memrealtime"] = true;529[[fallthrough]];530case GK_GFX705:531case GK_GFX704:532case 
GK_GFX703:533case GK_GFX702:534case GK_GFX701:535case GK_GFX700:536Features["ci-insts"] = true;537[[fallthrough]];538case GK_GFX602:539case GK_GFX601:540case GK_GFX600:541Features["image-insts"] = true;542Features["s-memtime-inst"] = true;543Features["gws"] = true;544break;545case GK_NONE:546break;547default:548llvm_unreachable("Unhandled GPU!");549}550} else {551if (GPU.empty())552GPU = "r600";553554switch (llvm::AMDGPU::parseArchR600(GPU)) {555case GK_CAYMAN:556case GK_CYPRESS:557case GK_RV770:558case GK_RV670:559// TODO: Add fp64 when implemented.560break;561case GK_TURKS:562case GK_CAICOS:563case GK_BARTS:564case GK_SUMO:565case GK_REDWOOD:566case GK_JUNIPER:567case GK_CEDAR:568case GK_RV730:569case GK_RV710:570case GK_RS880:571case GK_R630:572case GK_R600:573break;574default:575llvm_unreachable("Unhandled GPU!");576}577}578}579580static bool isWave32Capable(StringRef GPU, const Triple &T) {581bool IsWave32Capable = false;582// XXX - What does the member GPU mean if device name string passed here?583if (T.isAMDGCN()) {584switch (parseArchAMDGCN(GPU)) {585case GK_GFX1201:586case GK_GFX1200:587case GK_GFX1152:588case GK_GFX1151:589case GK_GFX1150:590case GK_GFX1103:591case GK_GFX1102:592case GK_GFX1101:593case GK_GFX1100:594case GK_GFX1036:595case GK_GFX1035:596case GK_GFX1034:597case GK_GFX1033:598case GK_GFX1032:599case GK_GFX1031:600case GK_GFX1030:601case GK_GFX1012:602case GK_GFX1011:603case GK_GFX1013:604case GK_GFX1010:605case GK_GFX12_GENERIC:606case GK_GFX11_GENERIC:607case GK_GFX10_3_GENERIC:608case GK_GFX10_1_GENERIC:609IsWave32Capable = true;610break;611default:612break;613}614}615return IsWave32Capable;616}617618std::pair<FeatureError, StringRef>619AMDGPU::insertWaveSizeFeature(StringRef GPU, const Triple &T,620StringMap<bool> &Features) {621bool IsWave32Capable = isWave32Capable(GPU, T);622const bool IsNullGPU = GPU.empty();623const bool HaveWave32 = Features.count("wavefrontsize32");624const bool HaveWave64 = Features.count("wavefrontsize64");625if 
(HaveWave32 && HaveWave64) {626return {AMDGPU::INVALID_FEATURE_COMBINATION,627"'wavefrontsize32' and 'wavefrontsize64' are mutually exclusive"};628}629if (HaveWave32 && !IsNullGPU && !IsWave32Capable) {630return {AMDGPU::UNSUPPORTED_TARGET_FEATURE, "wavefrontsize32"};631}632// Don't assume any wavesize with an unknown subtarget.633if (!IsNullGPU) {634// Default to wave32 if available, or wave64 if not635if (!HaveWave32 && !HaveWave64) {636StringRef DefaultWaveSizeFeature =637IsWave32Capable ? "wavefrontsize32" : "wavefrontsize64";638Features.insert(std::make_pair(DefaultWaveSizeFeature, true));639}640}641return {NO_ERROR, StringRef()};642}643644645