|  | //===-- TargetParser - Parser for target features ---------------*- C++ -*-===// | 
|  | // | 
|  | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. | 
|  | // See https://llvm.org/LICENSE.txt for license information. | 
|  | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception | 
|  | // | 
|  | //===----------------------------------------------------------------------===// | 
|  | // | 
|  | // This file implements a target parser to recognise hardware features such as | 
|  | // FPU/CPU/ARCH names as well as specific support such as HDIV, etc. | 
|  | // | 
|  | //===----------------------------------------------------------------------===// | 
|  |  | 
|  | #include "llvm/TargetParser/TargetParser.h" | 
|  | #include "llvm/ADT/ArrayRef.h" | 
|  | #include "llvm/TargetParser/Triple.h" | 
|  |  | 
|  | using namespace llvm; | 
|  | using namespace AMDGPU; | 
|  |  | 
|  | namespace { | 
|  |  | 
/// One row of the processor tables in this file. The rows are written as
/// positional aggregate initialisers, so the member order here must not change.
struct GPUInfo {
  // Processor spelling compared against the user-supplied string by the
  // parseArch*() functions.
  StringLiteral Name;
  // Name returned by the getArchName*() functions for this row's Kind.
  StringLiteral CanonicalName;
  // Key that getArchEntry() searches the tables by.
  AMDGPU::GPUKind Kind;
  // Feature flags for this processor; the tables fill it with FEATURE_*
  // values combined with '|'.
  unsigned Features;
};
|  |  | 
// Processor names accepted for R600 lookups (parseArchR600, getArchNameR600,
// getArchAttrR600, fillValidArchListR600). Several names may share one Kind;
// such rows also share a canonical name.
// getArchEntry() binary-searches this table by Kind, so rows must be kept in
// ascending GPUKind order.
constexpr GPUInfo R600GPUs[] = {
  // Name       Canonical    Kind        Features
  //            Name
  {{"r600"},    {"r600"},    GK_R600,    FEATURE_NONE },
  {{"rv630"},   {"r600"},    GK_R600,    FEATURE_NONE },
  {{"rv635"},   {"r600"},    GK_R600,    FEATURE_NONE },
  {{"r630"},    {"r630"},    GK_R630,    FEATURE_NONE },
  {{"rs780"},   {"rs880"},   GK_RS880,   FEATURE_NONE },
  {{"rs880"},   {"rs880"},   GK_RS880,   FEATURE_NONE },
  {{"rv610"},   {"rs880"},   GK_RS880,   FEATURE_NONE },
  {{"rv620"},   {"rs880"},   GK_RS880,   FEATURE_NONE },
  {{"rv670"},   {"rv670"},   GK_RV670,   FEATURE_NONE },
  {{"rv710"},   {"rv710"},   GK_RV710,   FEATURE_NONE },
  {{"rv730"},   {"rv730"},   GK_RV730,   FEATURE_NONE },
  {{"rv740"},   {"rv770"},   GK_RV770,   FEATURE_NONE },
  {{"rv770"},   {"rv770"},   GK_RV770,   FEATURE_NONE },
  {{"cedar"},   {"cedar"},   GK_CEDAR,   FEATURE_NONE },
  {{"palm"},    {"cedar"},   GK_CEDAR,   FEATURE_NONE },
  {{"cypress"}, {"cypress"}, GK_CYPRESS, FEATURE_FMA  },
  {{"hemlock"}, {"cypress"}, GK_CYPRESS, FEATURE_FMA  },
  {{"juniper"}, {"juniper"}, GK_JUNIPER, FEATURE_NONE },
  {{"redwood"}, {"redwood"}, GK_REDWOOD, FEATURE_NONE },
  {{"sumo"},    {"sumo"},    GK_SUMO,    FEATURE_NONE },
  {{"sumo2"},   {"sumo"},    GK_SUMO,    FEATURE_NONE },
  {{"barts"},   {"barts"},   GK_BARTS,   FEATURE_NONE },
  {{"caicos"},  {"caicos"},  GK_CAICOS,  FEATURE_NONE },
  {{"aruba"},   {"cayman"},  GK_CAYMAN,  FEATURE_FMA  },
  {{"cayman"},  {"cayman"},  GK_CAYMAN,  FEATURE_FMA  },
  {{"turks"},   {"turks"},   GK_TURKS,   FEATURE_NONE }
};
|  |  | 
// Processor names accepted for AMDGCN lookups (parseArchAMDGCN,
// getArchNameAMDGCN, getArchAttrAMDGCN, fillValidArchListAMDGCN).
// This table must be sorted by the value of GPUKind: getArchEntry() locates
// rows with a binary search on Kind. Rows that share a Kind (marketing-name
// aliases of a gfx name) carry the same canonical name and feature mask.
// Don't bother listing the implicitly true features
constexpr GPUInfo AMDGCNGPUs[] = {
  // Name         Canonical    Kind        Features
  //              Name
  {{"gfx600"},    {"gfx600"},  GK_GFX600,  FEATURE_FAST_FMA_F32},
  {{"tahiti"},    {"gfx600"},  GK_GFX600,  FEATURE_FAST_FMA_F32},
  {{"gfx601"},    {"gfx601"},  GK_GFX601,  FEATURE_NONE},
  {{"pitcairn"},  {"gfx601"},  GK_GFX601,  FEATURE_NONE},
  {{"verde"},     {"gfx601"},  GK_GFX601,  FEATURE_NONE},
  {{"gfx602"},    {"gfx602"},  GK_GFX602,  FEATURE_NONE},
  {{"hainan"},    {"gfx602"},  GK_GFX602,  FEATURE_NONE},
  {{"oland"},     {"gfx602"},  GK_GFX602,  FEATURE_NONE},
  {{"gfx700"},    {"gfx700"},  GK_GFX700,  FEATURE_NONE},
  {{"kaveri"},    {"gfx700"},  GK_GFX700,  FEATURE_NONE},
  {{"gfx701"},    {"gfx701"},  GK_GFX701,  FEATURE_FAST_FMA_F32},
  {{"hawaii"},    {"gfx701"},  GK_GFX701,  FEATURE_FAST_FMA_F32},
  {{"gfx702"},    {"gfx702"},  GK_GFX702,  FEATURE_FAST_FMA_F32},
  {{"gfx703"},    {"gfx703"},  GK_GFX703,  FEATURE_NONE},
  {{"kabini"},    {"gfx703"},  GK_GFX703,  FEATURE_NONE},
  {{"mullins"},   {"gfx703"},  GK_GFX703,  FEATURE_NONE},
  {{"gfx704"},    {"gfx704"},  GK_GFX704,  FEATURE_NONE},
  {{"bonaire"},   {"gfx704"},  GK_GFX704,  FEATURE_NONE},
  {{"gfx705"},    {"gfx705"},  GK_GFX705,  FEATURE_NONE},
  {{"gfx801"},    {"gfx801"},  GK_GFX801,  FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
  {{"carrizo"},   {"gfx801"},  GK_GFX801,  FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
  {{"gfx802"},    {"gfx802"},  GK_GFX802,  FEATURE_FAST_DENORMAL_F32},
  {{"iceland"},   {"gfx802"},  GK_GFX802,  FEATURE_FAST_DENORMAL_F32},
  {{"tonga"},     {"gfx802"},  GK_GFX802,  FEATURE_FAST_DENORMAL_F32},
  {{"gfx803"},    {"gfx803"},  GK_GFX803,  FEATURE_FAST_DENORMAL_F32},
  {{"fiji"},      {"gfx803"},  GK_GFX803,  FEATURE_FAST_DENORMAL_F32},
  {{"polaris10"}, {"gfx803"},  GK_GFX803,  FEATURE_FAST_DENORMAL_F32},
  {{"polaris11"}, {"gfx803"},  GK_GFX803,  FEATURE_FAST_DENORMAL_F32},
  {{"gfx805"},    {"gfx805"},  GK_GFX805,  FEATURE_FAST_DENORMAL_F32},
  {{"tongapro"},  {"gfx805"},  GK_GFX805,  FEATURE_FAST_DENORMAL_F32},
  {{"gfx810"},    {"gfx810"},  GK_GFX810,  FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
  {{"stoney"},    {"gfx810"},  GK_GFX810,  FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
  {{"gfx900"},    {"gfx900"},  GK_GFX900,  FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
  {{"gfx902"},    {"gfx902"},  GK_GFX902,  FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
  {{"gfx904"},    {"gfx904"},  GK_GFX904,  FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
  {{"gfx906"},    {"gfx906"},  GK_GFX906,  FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK|FEATURE_SRAMECC},
  {{"gfx908"},    {"gfx908"},  GK_GFX908,  FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK|FEATURE_SRAMECC},
  {{"gfx909"},    {"gfx909"},  GK_GFX909,  FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
  {{"gfx90a"},    {"gfx90a"},  GK_GFX90A,  FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK|FEATURE_SRAMECC},
  {{"gfx90c"},    {"gfx90c"},  GK_GFX90C,  FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK},
  {{"gfx940"},    {"gfx940"},  GK_GFX940,  FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK|FEATURE_SRAMECC},
  {{"gfx941"},    {"gfx941"},  GK_GFX941,  FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK|FEATURE_SRAMECC},
  {{"gfx942"},    {"gfx942"},  GK_GFX942,  FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_XNACK|FEATURE_SRAMECC},
  {{"gfx1010"},   {"gfx1010"}, GK_GFX1010, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_XNACK|FEATURE_WGP},
  {{"gfx1011"},   {"gfx1011"}, GK_GFX1011, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_XNACK|FEATURE_WGP},
  {{"gfx1012"},   {"gfx1012"}, GK_GFX1012, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_XNACK|FEATURE_WGP},
  {{"gfx1013"},   {"gfx1013"}, GK_GFX1013, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_XNACK|FEATURE_WGP},
  {{"gfx1030"},   {"gfx1030"}, GK_GFX1030, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
  {{"gfx1031"},   {"gfx1031"}, GK_GFX1031, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
  {{"gfx1032"},   {"gfx1032"}, GK_GFX1032, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
  {{"gfx1033"},   {"gfx1033"}, GK_GFX1033, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
  {{"gfx1034"},   {"gfx1034"}, GK_GFX1034, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
  {{"gfx1035"},   {"gfx1035"}, GK_GFX1035, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
  {{"gfx1036"},   {"gfx1036"}, GK_GFX1036, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
  {{"gfx1100"},   {"gfx1100"}, GK_GFX1100, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
  {{"gfx1101"},   {"gfx1101"}, GK_GFX1101, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
  {{"gfx1102"},   {"gfx1102"}, GK_GFX1102, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
  {{"gfx1103"},   {"gfx1103"}, GK_GFX1103, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
  {{"gfx1150"},   {"gfx1150"}, GK_GFX1150, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
  {{"gfx1151"},   {"gfx1151"}, GK_GFX1151, FEATURE_FAST_FMA_F32|FEATURE_FAST_DENORMAL_F32|FEATURE_WAVE32|FEATURE_WGP},
};
|  |  | 
|  | const GPUInfo *getArchEntry(AMDGPU::GPUKind AK, ArrayRef<GPUInfo> Table) { | 
|  | GPUInfo Search = { {""}, {""}, AK, AMDGPU::FEATURE_NONE }; | 
|  |  | 
|  | auto I = | 
|  | llvm::lower_bound(Table, Search, [](const GPUInfo &A, const GPUInfo &B) { | 
|  | return A.Kind < B.Kind; | 
|  | }); | 
|  |  | 
|  | if (I == Table.end()) | 
|  | return nullptr; | 
|  | return I; | 
|  | } | 
|  |  | 
|  | } // namespace | 
|  |  | 
|  | StringRef llvm::AMDGPU::getArchNameAMDGCN(GPUKind AK) { | 
|  | if (const auto *Entry = getArchEntry(AK, AMDGCNGPUs)) | 
|  | return Entry->CanonicalName; | 
|  | return ""; | 
|  | } | 
|  |  | 
|  | StringRef llvm::AMDGPU::getArchNameR600(GPUKind AK) { | 
|  | if (const auto *Entry = getArchEntry(AK, R600GPUs)) | 
|  | return Entry->CanonicalName; | 
|  | return ""; | 
|  | } | 
|  |  | 
|  | AMDGPU::GPUKind llvm::AMDGPU::parseArchAMDGCN(StringRef CPU) { | 
|  | for (const auto &C : AMDGCNGPUs) { | 
|  | if (CPU == C.Name) | 
|  | return C.Kind; | 
|  | } | 
|  |  | 
|  | return AMDGPU::GPUKind::GK_NONE; | 
|  | } | 
|  |  | 
|  | AMDGPU::GPUKind llvm::AMDGPU::parseArchR600(StringRef CPU) { | 
|  | for (const auto &C : R600GPUs) { | 
|  | if (CPU == C.Name) | 
|  | return C.Kind; | 
|  | } | 
|  |  | 
|  | return AMDGPU::GPUKind::GK_NONE; | 
|  | } | 
|  |  | 
|  | unsigned AMDGPU::getArchAttrAMDGCN(GPUKind AK) { | 
|  | if (const auto *Entry = getArchEntry(AK, AMDGCNGPUs)) | 
|  | return Entry->Features; | 
|  | return FEATURE_NONE; | 
|  | } | 
|  |  | 
|  | unsigned AMDGPU::getArchAttrR600(GPUKind AK) { | 
|  | if (const auto *Entry = getArchEntry(AK, R600GPUs)) | 
|  | return Entry->Features; | 
|  | return FEATURE_NONE; | 
|  | } | 
|  |  | 
|  | void AMDGPU::fillValidArchListAMDGCN(SmallVectorImpl<StringRef> &Values) { | 
|  | // XXX: Should this only report unique canonical names? | 
|  | for (const auto &C : AMDGCNGPUs) | 
|  | Values.push_back(C.Name); | 
|  | } | 
|  |  | 
|  | void AMDGPU::fillValidArchListR600(SmallVectorImpl<StringRef> &Values) { | 
|  | for (const auto &C : R600GPUs) | 
|  | Values.push_back(C.Name); | 
|  | } | 
|  |  | 
|  | AMDGPU::IsaVersion AMDGPU::getIsaVersion(StringRef GPU) { | 
|  | AMDGPU::GPUKind AK = parseArchAMDGCN(GPU); | 
|  | if (AK == AMDGPU::GPUKind::GK_NONE) { | 
|  | if (GPU == "generic-hsa") | 
|  | return {7, 0, 0}; | 
|  | if (GPU == "generic") | 
|  | return {6, 0, 0}; | 
|  | return {0, 0, 0}; | 
|  | } | 
|  |  | 
|  | switch (AK) { | 
|  | case GK_GFX600:  return {6, 0, 0}; | 
|  | case GK_GFX601:  return {6, 0, 1}; | 
|  | case GK_GFX602:  return {6, 0, 2}; | 
|  | case GK_GFX700:  return {7, 0, 0}; | 
|  | case GK_GFX701:  return {7, 0, 1}; | 
|  | case GK_GFX702:  return {7, 0, 2}; | 
|  | case GK_GFX703:  return {7, 0, 3}; | 
|  | case GK_GFX704:  return {7, 0, 4}; | 
|  | case GK_GFX705:  return {7, 0, 5}; | 
|  | case GK_GFX801:  return {8, 0, 1}; | 
|  | case GK_GFX802:  return {8, 0, 2}; | 
|  | case GK_GFX803:  return {8, 0, 3}; | 
|  | case GK_GFX805:  return {8, 0, 5}; | 
|  | case GK_GFX810:  return {8, 1, 0}; | 
|  | case GK_GFX900:  return {9, 0, 0}; | 
|  | case GK_GFX902:  return {9, 0, 2}; | 
|  | case GK_GFX904:  return {9, 0, 4}; | 
|  | case GK_GFX906:  return {9, 0, 6}; | 
|  | case GK_GFX908:  return {9, 0, 8}; | 
|  | case GK_GFX909:  return {9, 0, 9}; | 
|  | case GK_GFX90A:  return {9, 0, 10}; | 
|  | case GK_GFX90C:  return {9, 0, 12}; | 
|  | case GK_GFX940:  return {9, 4, 0}; | 
|  | case GK_GFX941:  return {9, 4, 1}; | 
|  | case GK_GFX942:  return {9, 4, 2}; | 
|  | case GK_GFX1010: return {10, 1, 0}; | 
|  | case GK_GFX1011: return {10, 1, 1}; | 
|  | case GK_GFX1012: return {10, 1, 2}; | 
|  | case GK_GFX1013: return {10, 1, 3}; | 
|  | case GK_GFX1030: return {10, 3, 0}; | 
|  | case GK_GFX1031: return {10, 3, 1}; | 
|  | case GK_GFX1032: return {10, 3, 2}; | 
|  | case GK_GFX1033: return {10, 3, 3}; | 
|  | case GK_GFX1034: return {10, 3, 4}; | 
|  | case GK_GFX1035: return {10, 3, 5}; | 
|  | case GK_GFX1036: return {10, 3, 6}; | 
|  | case GK_GFX1100: return {11, 0, 0}; | 
|  | case GK_GFX1101: return {11, 0, 1}; | 
|  | case GK_GFX1102: return {11, 0, 2}; | 
|  | case GK_GFX1103: return {11, 0, 3}; | 
|  | case GK_GFX1150: return {11, 5, 0}; | 
|  | case GK_GFX1151: return {11, 5, 1}; | 
|  | default:         return {0, 0, 0}; | 
|  | } | 
|  | } | 
|  |  | 
|  | StringRef AMDGPU::getCanonicalArchName(const Triple &T, StringRef Arch) { | 
|  | assert(T.isAMDGPU()); | 
|  | auto ProcKind = T.isAMDGCN() ? parseArchAMDGCN(Arch) : parseArchR600(Arch); | 
|  | if (ProcKind == GK_NONE) | 
|  | return StringRef(); | 
|  |  | 
|  | return T.isAMDGCN() ? getArchNameAMDGCN(ProcKind) : getArchNameR600(ProcKind); | 
|  | } | 
|  |  | 
/// Sets the default subtarget feature entries for processor \p GPU in
/// \p Features.
///
/// For AMDGCN triples the processor name is parsed with parseArchAMDGCN() and
/// each feature implied by that processor is set to true; existing entries for
/// other keys are left alone. An unrecognised name (GK_NONE) adds nothing.
/// For any other triple the name is parsed with parseArchR600() (an empty name
/// is treated as "r600") and no features are added at present.
///
/// \param GPU      Processor name.
/// \param T        Target triple; only T.isAMDGCN() is consulted.
/// \param Features Map updated in place.
void AMDGPU::fillAMDGPUFeatureMap(StringRef GPU, const Triple &T,
                                  StringMap<bool> &Features) {
  // XXX - What does the member GPU mean if device name string passed here?
  if (T.isAMDGCN()) {
    // Cases are listed from newest to oldest. The GFX11, GFX10.3, GFX10.1 and
    // GFX940 groups spell out their full feature lists and end with a break;
    // from GFX90A downwards each group adds its own features and then falls
    // through into the next older group.
    switch (parseArchAMDGCN(GPU)) {
    case GK_GFX1151:
    case GK_GFX1150:
    case GK_GFX1103:
    case GK_GFX1102:
    case GK_GFX1101:
    case GK_GFX1100:
      Features["ci-insts"] = true;
      Features["dot5-insts"] = true;
      Features["dot7-insts"] = true;
      Features["dot8-insts"] = true;
      Features["dot9-insts"] = true;
      Features["dot10-insts"] = true;
      Features["dl-insts"] = true;
      Features["16-bit-insts"] = true;
      Features["dpp"] = true;
      Features["gfx8-insts"] = true;
      Features["gfx9-insts"] = true;
      Features["gfx10-insts"] = true;
      Features["gfx10-3-insts"] = true;
      Features["gfx11-insts"] = true;
      Features["atomic-fadd-rtn-insts"] = true;
      Features["image-insts"] = true;
      break;
    case GK_GFX1036:
    case GK_GFX1035:
    case GK_GFX1034:
    case GK_GFX1033:
    case GK_GFX1032:
    case GK_GFX1031:
    case GK_GFX1030:
      Features["ci-insts"] = true;
      Features["dot1-insts"] = true;
      Features["dot2-insts"] = true;
      Features["dot5-insts"] = true;
      Features["dot6-insts"] = true;
      Features["dot7-insts"] = true;
      Features["dot10-insts"] = true;
      Features["dl-insts"] = true;
      Features["16-bit-insts"] = true;
      Features["dpp"] = true;
      Features["gfx8-insts"] = true;
      Features["gfx9-insts"] = true;
      Features["gfx10-insts"] = true;
      Features["gfx10-3-insts"] = true;
      Features["image-insts"] = true;
      Features["s-memrealtime"] = true;
      Features["s-memtime-inst"] = true;
      break;
    case GK_GFX1012:
    case GK_GFX1011:
      // gfx1011/gfx1012 get the dot-product features on top of everything
      // gfx1010/gfx1013 get below.
      Features["dot1-insts"] = true;
      Features["dot2-insts"] = true;
      Features["dot5-insts"] = true;
      Features["dot6-insts"] = true;
      Features["dot7-insts"] = true;
      Features["dot10-insts"] = true;
      [[fallthrough]];
    case GK_GFX1013:
    case GK_GFX1010:
      Features["dl-insts"] = true;
      Features["ci-insts"] = true;
      Features["16-bit-insts"] = true;
      Features["dpp"] = true;
      Features["gfx8-insts"] = true;
      Features["gfx9-insts"] = true;
      Features["gfx10-insts"] = true;
      Features["image-insts"] = true;
      Features["s-memrealtime"] = true;
      Features["s-memtime-inst"] = true;
      break;
    case GK_GFX942:
    case GK_GFX941:
    case GK_GFX940:
      // Self-contained list: this group breaks instead of falling through, and
      // unlike the GFX90A chain below it does not set "image-insts".
      Features["gfx940-insts"] = true;
      Features["fp8-insts"] = true;
      Features["atomic-ds-pk-add-16-insts"] = true;
      Features["atomic-flat-pk-add-16-insts"] = true;
      Features["atomic-global-pk-add-bf16-inst"] = true;
      Features["gfx90a-insts"] = true;
      Features["atomic-buffer-global-pk-add-f16-insts"] = true;
      Features["atomic-fadd-rtn-insts"] = true;
      Features["dot3-insts"] = true;
      Features["dot4-insts"] = true;
      Features["dot5-insts"] = true;
      Features["dot6-insts"] = true;
      Features["mai-insts"] = true;
      Features["dl-insts"] = true;
      Features["dot1-insts"] = true;
      Features["dot2-insts"] = true;
      Features["dot7-insts"] = true;
      Features["dot10-insts"] = true;
      Features["gfx9-insts"] = true;
      Features["gfx8-insts"] = true;
      Features["16-bit-insts"] = true;
      Features["dpp"] = true;
      Features["s-memrealtime"] = true;
      Features["ci-insts"] = true;
      Features["s-memtime-inst"] = true;
      break;
    // Start of the cumulative chain: every group from here to GFX600 falls
    // through, so a processor receives its own features plus those of all
    // groups listed after it.
    case GK_GFX90A:
      Features["gfx90a-insts"] = true;
      Features["atomic-buffer-global-pk-add-f16-insts"] = true;
      Features["atomic-fadd-rtn-insts"] = true;
      [[fallthrough]];
    case GK_GFX908:
      Features["dot3-insts"] = true;
      Features["dot4-insts"] = true;
      Features["dot5-insts"] = true;
      Features["dot6-insts"] = true;
      Features["mai-insts"] = true;
      [[fallthrough]];
    case GK_GFX906:
      Features["dl-insts"] = true;
      Features["dot1-insts"] = true;
      Features["dot2-insts"] = true;
      Features["dot7-insts"] = true;
      Features["dot10-insts"] = true;
      [[fallthrough]];
    case GK_GFX90C:
    case GK_GFX909:
    case GK_GFX904:
    case GK_GFX902:
    case GK_GFX900:
      Features["gfx9-insts"] = true;
      [[fallthrough]];
    case GK_GFX810:
    case GK_GFX805:
    case GK_GFX803:
    case GK_GFX802:
    case GK_GFX801:
      Features["gfx8-insts"] = true;
      Features["16-bit-insts"] = true;
      Features["dpp"] = true;
      Features["s-memrealtime"] = true;
      [[fallthrough]];
    case GK_GFX705:
    case GK_GFX704:
    case GK_GFX703:
    case GK_GFX702:
    case GK_GFX701:
    case GK_GFX700:
      Features["ci-insts"] = true;
      [[fallthrough]];
    case GK_GFX602:
    case GK_GFX601:
    case GK_GFX600:
      Features["image-insts"] = true;
      Features["s-memtime-inst"] = true;
      break;
    case GK_NONE:
      // Unrecognised processor name: leave Features untouched.
      break;
    default:
      // A kind that parseArchAMDGCN() can return but no case above handles.
      llvm_unreachable("Unhandled GPU!");
    }
  } else {
    // Non-AMDGCN triple: treat the name as an R600 processor, defaulting to
    // "r600" when none was given.
    if (GPU.empty())
      GPU = "r600";

    // No features are recorded for R600 processors yet; the switch only
    // checks that the kind is one of those listed.
    // NOTE(review): a non-empty name that parseArchR600() does not recognise
    // yields GK_NONE, which is not listed below and so reaches the
    // llvm_unreachable in the default case - confirm callers never pass one.
    switch (llvm::AMDGPU::parseArchR600(GPU)) {
    case GK_CAYMAN:
    case GK_CYPRESS:
    case GK_RV770:
    case GK_RV670:
      // TODO: Add fp64 when implemented.
      break;
    case GK_TURKS:
    case GK_CAICOS:
    case GK_BARTS:
    case GK_SUMO:
    case GK_REDWOOD:
    case GK_JUNIPER:
    case GK_CEDAR:
    case GK_RV730:
    case GK_RV710:
    case GK_RS880:
    case GK_R630:
    case GK_R600:
      break;
    default:
      llvm_unreachable("Unhandled GPU!");
    }
  }
}
|  |  | 
|  | static bool isWave32Capable(StringRef GPU, const Triple &T) { | 
|  | bool IsWave32Capable = false; | 
|  | // XXX - What does the member GPU mean if device name string passed here? | 
|  | if (T.isAMDGCN()) { | 
|  | switch (parseArchAMDGCN(GPU)) { | 
|  | case GK_GFX1151: | 
|  | case GK_GFX1150: | 
|  | case GK_GFX1103: | 
|  | case GK_GFX1102: | 
|  | case GK_GFX1101: | 
|  | case GK_GFX1100: | 
|  | case GK_GFX1036: | 
|  | case GK_GFX1035: | 
|  | case GK_GFX1034: | 
|  | case GK_GFX1033: | 
|  | case GK_GFX1032: | 
|  | case GK_GFX1031: | 
|  | case GK_GFX1030: | 
|  | case GK_GFX1012: | 
|  | case GK_GFX1011: | 
|  | case GK_GFX1013: | 
|  | case GK_GFX1010: | 
|  | IsWave32Capable = true; | 
|  | break; | 
|  | default: | 
|  | break; | 
|  | } | 
|  | } | 
|  | return IsWave32Capable; | 
|  | } | 
|  |  | 
|  | bool AMDGPU::insertWaveSizeFeature(StringRef GPU, const Triple &T, | 
|  | StringMap<bool> &Features, | 
|  | std::string &ErrorMsg) { | 
|  | bool IsWave32Capable = isWave32Capable(GPU, T); | 
|  | const bool IsNullGPU = GPU.empty(); | 
|  | // FIXME: Not diagnosing wavefrontsize32 on wave64 only targets. | 
|  | const bool HaveWave32 = | 
|  | (IsWave32Capable || IsNullGPU) && Features.count("wavefrontsize32"); | 
|  | const bool HaveWave64 = Features.count("wavefrontsize64"); | 
|  | if (HaveWave32 && HaveWave64) { | 
|  | ErrorMsg = "'wavefrontsize32' and 'wavefrontsize64' are mutually exclusive"; | 
|  | return false; | 
|  | } | 
|  | // Don't assume any wavesize with an unknown subtarget. | 
|  | if (!IsNullGPU) { | 
|  | // Default to wave32 if available, or wave64 if not | 
|  | if (!HaveWave32 && !HaveWave64) { | 
|  | StringRef DefaultWaveSizeFeature = | 
|  | IsWave32Capable ? "wavefrontsize32" : "wavefrontsize64"; | 
|  | Features.insert(std::make_pair(DefaultWaveSizeFeature, true)); | 
|  | } | 
|  | } | 
|  | return true; | 
|  | } |