| 1 | //===- NVVMReflect.cpp - NVVM Emulate conditional compilation -------------===// | 
|---|
| 2 | // | 
|---|
| 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. | 
|---|
| 4 | // See https://llvm.org/LICENSE.txt for license information. | 
|---|
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception | 
|---|
| 6 | // | 
|---|
| 7 | //===----------------------------------------------------------------------===// | 
|---|
| 8 | // | 
|---|
| 9 | // This pass replaces occurrences of __nvvm_reflect("foo") and llvm.nvvm.reflect | 
|---|
| 10 | // with an integer. | 
|---|
| 11 | // | 
|---|
| 12 | // We choose the value we use by looking at metadata in the module itself.  Note | 
|---|
| 13 | // that we intentionally only have one way to choose these values, because other | 
|---|
| 14 | // parts of LLVM (particularly, InstCombineCall) rely on being able to predict | 
|---|
| 15 | // the values chosen by this pass. | 
|---|
| 16 | // | 
|---|
| 17 | // If we see an unknown string, we replace its call with 0. | 
|---|
| 18 | // | 
|---|
| 19 | //===----------------------------------------------------------------------===// | 
|---|
| 20 |  | 
|---|
| 21 | #include "NVPTX.h" | 
|---|
| 22 | #include "llvm/ADT/SmallVector.h" | 
|---|
| 23 | #include "llvm/ADT/StringExtras.h" | 
|---|
| 24 | #include "llvm/Analysis/ConstantFolding.h" | 
|---|
| 25 | #include "llvm/CodeGen/CommandFlags.h" | 
|---|
| 26 | #include "llvm/IR/Constants.h" | 
|---|
| 27 | #include "llvm/IR/DerivedTypes.h" | 
|---|
| 28 | #include "llvm/IR/Function.h" | 
|---|
| 29 | #include "llvm/IR/Instructions.h" | 
|---|
| 30 | #include "llvm/IR/Intrinsics.h" | 
|---|
| 31 | #include "llvm/IR/IntrinsicsNVPTX.h" | 
|---|
| 32 | #include "llvm/IR/Module.h" | 
|---|
| 33 | #include "llvm/IR/PassManager.h" | 
|---|
| 34 | #include "llvm/IR/Type.h" | 
|---|
| 35 | #include "llvm/Pass.h" | 
|---|
| 36 | #include "llvm/Support/CommandLine.h" | 
|---|
| 37 | #include "llvm/Support/Debug.h" | 
|---|
| 38 | #include "llvm/Support/raw_ostream.h" | 
|---|
| 39 | #include "llvm/Transforms/Scalar.h" | 
|---|
| 40 | #include "llvm/Transforms/Utils/BasicBlockUtils.h" | 
|---|
| 41 | #include "llvm/Transforms/Utils/Local.h" | 
|---|
| 42 | #define NVVM_REFLECT_FUNCTION "__nvvm_reflect" | 
|---|
| 43 | #define NVVM_REFLECT_OCL_FUNCTION "__nvvm_reflect_ocl" | 
|---|
| 44 | // Argument of reflect call to retrive arch number | 
|---|
| 45 | #define CUDA_ARCH_NAME "__CUDA_ARCH" | 
|---|
| 46 | // Argument of reflect call to retrive ftz mode | 
|---|
| 47 | #define CUDA_FTZ_NAME "__CUDA_FTZ" | 
|---|
| 48 | // Name of module metadata where ftz mode is stored | 
|---|
| 49 | #define CUDA_FTZ_MODULE_NAME "nvvm-reflect-ftz" | 
|---|
| 50 |  | 
|---|
| 51 | using namespace llvm; | 
|---|
| 52 |  | 
|---|
| 53 | #define DEBUG_TYPE "nvvm-reflect" | 
|---|
| 54 |  | 
|---|
| 55 | namespace { | 
|---|
| 56 | class NVVMReflect { | 
|---|
| 57 | // Map from reflect function call arguments to the value to replace the call | 
|---|
| 58 | // with. Should include __CUDA_FTZ and __CUDA_ARCH values. | 
|---|
| 59 | StringMap<unsigned> ReflectMap; | 
|---|
| 60 | bool handleReflectFunction(Module &M, StringRef ReflectName); | 
|---|
| 61 | void populateReflectMap(Module &M); | 
|---|
| 62 | void foldReflectCall(CallInst *Call, Constant *NewValue); | 
|---|
| 63 |  | 
|---|
| 64 | public: | 
|---|
| 65 | // __CUDA_FTZ is assigned in `runOnModule` by checking nvvm-reflect-ftz module | 
|---|
| 66 | // metadata. | 
|---|
| 67 | explicit NVVMReflect(unsigned SmVersion) | 
|---|
| 68 | : ReflectMap({{CUDA_ARCH_NAME, SmVersion * 10}}) {} | 
|---|
| 69 | bool runOnModule(Module &M); | 
|---|
| 70 | }; | 
|---|
| 71 |  | 
|---|
| 72 | class NVVMReflectLegacyPass : public ModulePass { | 
|---|
| 73 | NVVMReflect Impl; | 
|---|
| 74 |  | 
|---|
| 75 | public: | 
|---|
| 76 | static char ID; | 
|---|
| 77 | NVVMReflectLegacyPass(unsigned SmVersion) : ModulePass(ID), Impl(SmVersion) {} | 
|---|
| 78 | bool runOnModule(Module &M) override; | 
|---|
| 79 | }; | 
|---|
| 80 | } // namespace | 
|---|
| 81 |  | 
|---|
| 82 | ModulePass *llvm::createNVVMReflectPass(unsigned SmVersion) { | 
|---|
| 83 | return new NVVMReflectLegacyPass(SmVersion); | 
|---|
| 84 | } | 
|---|
| 85 |  | 
|---|
| 86 | static cl::opt<bool> | 
|---|
| 87 | NVVMReflectEnabled( "nvvm-reflect-enable", cl::init(Val: true), cl::Hidden, | 
|---|
| 88 | cl::desc( "NVVM reflection, enabled by default")); | 
|---|
| 89 |  | 
|---|
| 90 | char NVVMReflectLegacyPass::ID = 0; | 
|---|
| 91 | INITIALIZE_PASS(NVVMReflectLegacyPass, "nvvm-reflect", | 
|---|
| 92 | "Replace occurrences of __nvvm_reflect() calls with 0/1", false, | 
|---|
| 93 | false) | 
|---|
| 94 |  | 
|---|
| 95 | // Allow users to specify additional key/value pairs to reflect. These key/value | 
|---|
| 96 | // pairs are the last to be added to the ReflectMap, and therefore will take | 
|---|
| 97 | // precedence over initial values (i.e. __CUDA_FTZ from module medadata and | 
|---|
| 98 | // __CUDA_ARCH from SmVersion). | 
|---|
| 99 | static cl::list<std::string> ReflectList( | 
|---|
| 100 | "nvvm-reflect-add", cl::value_desc( "name=<int>"), cl::Hidden, | 
|---|
| 101 | cl::desc( "A key=value pair. Replace __nvvm_reflect(name) with value."), | 
|---|
| 102 | cl::ValueRequired); | 
|---|
| 103 |  | 
|---|
| 104 | // Set the ReflectMap with, first, the value of __CUDA_FTZ from module metadata, | 
|---|
| 105 | // and then the key/value pairs from the command line. | 
|---|
| 106 | void NVVMReflect::populateReflectMap(Module &M) { | 
|---|
| 107 | if (auto *Flag = mdconst::extract_or_null<ConstantInt>( | 
|---|
| 108 | MD: M.getModuleFlag(CUDA_FTZ_MODULE_NAME))) | 
|---|
| 109 | ReflectMap[CUDA_FTZ_NAME] = Flag->getSExtValue(); | 
|---|
| 110 |  | 
|---|
| 111 | for (auto &Option : ReflectList) { | 
|---|
| 112 | LLVM_DEBUG(dbgs() << "ReflectOption : "<< Option << "\n"); | 
|---|
| 113 | StringRef OptionRef(Option); | 
|---|
| 114 | auto [Name, Val] = OptionRef.split(Separator: '='); | 
|---|
| 115 | if (Name.empty()) | 
|---|
| 116 | report_fatal_error(reason: Twine( "Empty name in nvvm-reflect-add option '") + | 
|---|
| 117 | Option + "'"); | 
|---|
| 118 | if (Val.empty()) | 
|---|
| 119 | report_fatal_error(reason: Twine( "Missing value in nvvm-reflect-add option '") + | 
|---|
| 120 | Option + "'"); | 
|---|
| 121 | unsigned ValInt; | 
|---|
| 122 | if (!to_integer(S: Val.trim(), Num&: ValInt, Base: 10)) | 
|---|
| 123 | report_fatal_error( | 
|---|
| 124 | reason: Twine( "integer value expected in nvvm-reflect-add option '") + | 
|---|
| 125 | Option + "'"); | 
|---|
| 126 | ReflectMap[Name] = ValInt; | 
|---|
| 127 | } | 
|---|
| 128 | } | 
|---|
| 129 |  | 
|---|
| 130 | /// Process a reflect function by finding all its calls and replacing them with | 
|---|
| 131 | /// appropriate constant values. For __CUDA_FTZ, uses the module flag value. | 
|---|
| 132 | /// For __CUDA_ARCH, uses SmVersion * 10. For all other strings, uses 0. | 
|---|
| 133 | bool NVVMReflect::handleReflectFunction(Module &M, StringRef ReflectName) { | 
|---|
| 134 | Function *F = M.getFunction(Name: ReflectName); | 
|---|
| 135 | if (!F) | 
|---|
| 136 | return false; | 
|---|
| 137 | assert(F->isDeclaration() && "_reflect function should not have a body"); | 
|---|
| 138 | assert(F->getReturnType()->isIntegerTy() && | 
|---|
| 139 | "_reflect's return type should be integer"); | 
|---|
| 140 |  | 
|---|
| 141 | const bool Changed = !F->use_empty(); | 
|---|
| 142 | for (User *U : make_early_inc_range(Range: F->users())) { | 
|---|
| 143 | // Reflect function calls look like: | 
|---|
| 144 | // @arch = private unnamed_addr addrspace(1) constant [12 x i8] | 
|---|
| 145 | // c"__CUDA_ARCH\00" call i32 @__nvvm_reflect(ptr addrspacecast (ptr | 
|---|
| 146 | // addrspace(1) @arch to ptr)) We need to extract the string argument from | 
|---|
| 147 | // the call (i.e. "__CUDA_ARCH") | 
|---|
| 148 | auto *Call = dyn_cast<CallInst>(Val: U); | 
|---|
| 149 | if (!Call) | 
|---|
| 150 | report_fatal_error( | 
|---|
| 151 | reason: "__nvvm_reflect can only be used in a call instruction"); | 
|---|
| 152 | if (Call->getNumOperands() != 2) | 
|---|
| 153 | report_fatal_error(reason: "__nvvm_reflect requires exactly one argument"); | 
|---|
| 154 |  | 
|---|
| 155 | auto *GlobalStr = | 
|---|
| 156 | dyn_cast<Constant>(Val: Call->getArgOperand(i: 0)->stripPointerCasts()); | 
|---|
| 157 | if (!GlobalStr) | 
|---|
| 158 | report_fatal_error(reason: "__nvvm_reflect argument must be a constant string"); | 
|---|
| 159 |  | 
|---|
| 160 | auto *ConstantStr = | 
|---|
| 161 | dyn_cast<ConstantDataSequential>(Val: GlobalStr->getOperand(i: 0)); | 
|---|
| 162 | if (!ConstantStr) | 
|---|
| 163 | report_fatal_error(reason: "__nvvm_reflect argument must be a string constant"); | 
|---|
| 164 | if (!ConstantStr->isCString()) | 
|---|
| 165 | report_fatal_error( | 
|---|
| 166 | reason: "__nvvm_reflect argument must be a null-terminated string"); | 
|---|
| 167 |  | 
|---|
| 168 | StringRef ReflectArg = ConstantStr->getAsString().drop_back(); | 
|---|
| 169 | if (ReflectArg.empty()) | 
|---|
| 170 | report_fatal_error(reason: "__nvvm_reflect argument cannot be empty"); | 
|---|
| 171 | // Now that we have extracted the string argument, we can look it up in the | 
|---|
| 172 | // ReflectMap | 
|---|
| 173 | unsigned ReflectVal = 0; // The default value is 0 | 
|---|
| 174 | if (ReflectMap.contains(Key: ReflectArg)) | 
|---|
| 175 | ReflectVal = ReflectMap[ReflectArg]; | 
|---|
| 176 |  | 
|---|
| 177 | LLVM_DEBUG(dbgs() << "Replacing call of reflect function "<< F->getName() | 
|---|
| 178 | << "("<< ReflectArg << ") with value "<< ReflectVal | 
|---|
| 179 | << "\n"); | 
|---|
| 180 | auto *NewValue = ConstantInt::get(Ty: Call->getType(), V: ReflectVal); | 
|---|
| 181 | foldReflectCall(Call, NewValue); | 
|---|
| 182 | Call->eraseFromParent(); | 
|---|
| 183 | } | 
|---|
| 184 |  | 
|---|
| 185 | // Remove the __nvvm_reflect function from the module | 
|---|
| 186 | F->eraseFromParent(); | 
|---|
| 187 | return Changed; | 
|---|
| 188 | } | 
|---|
| 189 |  | 
|---|
| 190 | void NVVMReflect::foldReflectCall(CallInst *Call, Constant *NewValue) { | 
|---|
| 191 | SmallVector<Instruction *, 8> Worklist; | 
|---|
| 192 | // Replace an instruction with a constant and add all users of the instruction | 
|---|
| 193 | // to the worklist | 
|---|
| 194 | auto ReplaceInstructionWithConst = [&](Instruction *I, Constant *C) { | 
|---|
| 195 | for (auto *U : I->users()) | 
|---|
| 196 | if (auto *UI = dyn_cast<Instruction>(Val: U)) | 
|---|
| 197 | Worklist.push_back(Elt: UI); | 
|---|
| 198 | I->replaceAllUsesWith(V: C); | 
|---|
| 199 | }; | 
|---|
| 200 |  | 
|---|
| 201 | ReplaceInstructionWithConst(Call, NewValue); | 
|---|
| 202 |  | 
|---|
| 203 | auto &DL = Call->getModule()->getDataLayout(); | 
|---|
| 204 | while (!Worklist.empty()) { | 
|---|
| 205 | auto *I = Worklist.pop_back_val(); | 
|---|
| 206 | if (auto *C = ConstantFoldInstruction(I, DL)) { | 
|---|
| 207 | ReplaceInstructionWithConst(I, C); | 
|---|
| 208 | if (isInstructionTriviallyDead(I)) | 
|---|
| 209 | I->eraseFromParent(); | 
|---|
| 210 | } else if (I->isTerminator()) { | 
|---|
| 211 | ConstantFoldTerminator(BB: I->getParent()); | 
|---|
| 212 | } | 
|---|
| 213 | } | 
|---|
| 214 | } | 
|---|
| 215 |  | 
|---|
| 216 | bool NVVMReflect::runOnModule(Module &M) { | 
|---|
| 217 | if (!NVVMReflectEnabled) | 
|---|
| 218 | return false; | 
|---|
| 219 | populateReflectMap(M); | 
|---|
| 220 | bool Changed = true; | 
|---|
| 221 | Changed |= handleReflectFunction(M, NVVM_REFLECT_FUNCTION); | 
|---|
| 222 | Changed |= handleReflectFunction(M, NVVM_REFLECT_OCL_FUNCTION); | 
|---|
| 223 | Changed |= | 
|---|
| 224 | handleReflectFunction(M, ReflectName: Intrinsic::getName(id: Intrinsic::nvvm_reflect)); | 
|---|
| 225 | return Changed; | 
|---|
| 226 | } | 
|---|
| 227 |  | 
|---|
| 228 | bool NVVMReflectLegacyPass::runOnModule(Module &M) { | 
|---|
| 229 | return Impl.runOnModule(M); | 
|---|
| 230 | } | 
|---|
| 231 |  | 
|---|
| 232 | PreservedAnalyses NVVMReflectPass::run(Module &M, ModuleAnalysisManager &AM) { | 
|---|
| 233 | return NVVMReflect(SmVersion).runOnModule(M) ? PreservedAnalyses::none() | 
|---|
| 234 | : PreservedAnalyses::all(); | 
|---|
| 235 | } | 
|---|
| 236 |  | 
|---|