1//=====-- NVPTXSubtarget.h - Define Subtarget for the NVPTX ---*- C++ -*--====//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file declares the NVPTX specific subclass of TargetSubtarget.
10//
11//===----------------------------------------------------------------------===//
12
13#ifndef LLVM_LIB_TARGET_NVPTX_NVPTXSUBTARGET_H
14#define LLVM_LIB_TARGET_NVPTX_NVPTXSUBTARGET_H
15
16#include "NVPTX.h"
17#include "NVPTXFrameLowering.h"
18#include "NVPTXISelLowering.h"
19#include "NVPTXInstrInfo.h"
20#include "NVPTXRegisterInfo.h"
21#include "llvm/CodeGen/SelectionDAGTargetInfo.h"
22#include "llvm/CodeGen/TargetSubtargetInfo.h"
23#include "llvm/IR/DataLayout.h"
24#include <string>
25
26#define GET_SUBTARGETINFO_HEADER
27#include "NVPTXGenSubtargetInfo.inc"
28
29namespace llvm {
30
31class NVPTXSubtarget : public NVPTXGenSubtargetInfo {
32 virtual void anchor();
33 std::string TargetName;
34
35 // PTX version x.y is represented as 10*x+y, e.g. 3.1 == 31
36 unsigned PTXVersion;
37
38 // Full SM version x.y is represented as 100*x+10*y+feature, e.g. 3.1 == 310
39 // sm_90a == 901
40 unsigned int FullSmVersion;
41
42 // SM version x.y is represented as 10*x+y, e.g. 3.1 == 31. Derived from
43 // FullSmVersion.
44 unsigned int SmVersion;
45
46 const NVPTXTargetMachine &TM;
47 NVPTXInstrInfo InstrInfo;
48 NVPTXTargetLowering TLInfo;
49 SelectionDAGTargetInfo TSInfo;
50
51 // NVPTX does not have any call stack frame, but need a NVPTX specific
52 // FrameLowering class because TargetFrameLowering is abstract.
53 NVPTXFrameLowering FrameLowering;
54
55public:
56 /// This constructor initializes the data members to match that
57 /// of the specified module.
58 ///
59 NVPTXSubtarget(const Triple &TT, const std::string &CPU,
60 const std::string &FS, const NVPTXTargetMachine &TM);
61
62 const TargetFrameLowering *getFrameLowering() const override {
63 return &FrameLowering;
64 }
65 const NVPTXInstrInfo *getInstrInfo() const override { return &InstrInfo; }
66 const NVPTXRegisterInfo *getRegisterInfo() const override {
67 return &InstrInfo.getRegisterInfo();
68 }
69 const NVPTXTargetLowering *getTargetLowering() const override {
70 return &TLInfo;
71 }
72 const SelectionDAGTargetInfo *getSelectionDAGInfo() const override {
73 return &TSInfo;
74 }
75
76 bool hasAtomAddF64() const { return SmVersion >= 60; }
77 bool hasAtomScope() const { return SmVersion >= 60; }
78 bool hasAtomBitwise64() const { return SmVersion >= 32; }
79 bool hasAtomMinMax64() const { return SmVersion >= 32; }
80 bool hasLDG() const { return SmVersion >= 32; }
81 inline bool hasHWROT32() const { return SmVersion >= 32; }
82 bool hasImageHandles() const;
83 bool hasFP16Math() const { return SmVersion >= 53; }
84 bool hasBF16Math() const { return SmVersion >= 80; }
85 bool allowFP16Math() const;
86 bool hasMaskOperator() const { return PTXVersion >= 71; }
87 bool hasNoReturn() const { return SmVersion >= 30 && PTXVersion >= 64; }
88 unsigned int getFullSmVersion() const { return FullSmVersion; }
89 unsigned int getSmVersion() const { return getFullSmVersion() / 10; }
90 // GPUs with "a" suffix have include architecture-accelerated features that
91 // are supported on the specified architecture only, hence such targets do not
92 // follow the onion layer model. hasAAFeatures() allows distinguishing such
93 // GPU variants from the base GPU architecture.
94 // - 0 represents base GPU model,
95 // - non-zero value identifies particular architecture-accelerated variant.
96 bool hasAAFeatures() const { return getFullSmVersion() % 10; }
97 std::string getTargetName() const { return TargetName; }
98
99 // Get maximum value of required alignments among the supported data types.
100 // From the PTX ISA doc, section 8.2.3:
101 // The memory consistency model relates operations executed on memory
102 // locations with scalar data-types, which have a maximum size and alignment
103 // of 64 bits. Memory operations with a vector data-type are modelled as a
104 // set of equivalent memory operations with a scalar data-type, executed in
105 // an unspecified order on the elements in the vector.
106 unsigned getMaxRequiredAlignment() const { return 8; }
107
108 unsigned getPTXVersion() const { return PTXVersion; }
109
110 NVPTXSubtarget &initializeSubtargetDependencies(StringRef CPU, StringRef FS);
111 void ParseSubtargetFeatures(StringRef CPU, StringRef TuneCPU, StringRef FS);
112};
113
114} // End llvm namespace
115
116#endif
117