1 | //===----- CGHLSLRuntime.cpp - Interface to HLSL Runtimes -----------------===// |
2 | // |
3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
4 | // See https://llvm.org/LICENSE.txt for license information. |
5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
6 | // |
7 | //===----------------------------------------------------------------------===// |
8 | // |
9 | // This provides an abstract class for HLSL code generation. Concrete |
10 | // subclasses of this implement code generation for specific HLSL |
11 | // runtime libraries. |
12 | // |
13 | //===----------------------------------------------------------------------===// |
14 | |
15 | #include "CGHLSLRuntime.h" |
16 | #include "CGDebugInfo.h" |
17 | #include "CodeGenFunction.h" |
18 | #include "CodeGenModule.h" |
19 | #include "TargetInfo.h" |
20 | #include "clang/AST/ASTContext.h" |
21 | #include "clang/AST/Decl.h" |
22 | #include "clang/AST/RecursiveASTVisitor.h" |
23 | #include "clang/AST/Type.h" |
24 | #include "clang/Basic/TargetOptions.h" |
25 | #include "llvm/ADT/SmallVector.h" |
26 | #include "llvm/Frontend/HLSL/HLSLRootSignatureUtils.h" |
27 | #include "llvm/IR/Constants.h" |
28 | #include "llvm/IR/DerivedTypes.h" |
29 | #include "llvm/IR/GlobalVariable.h" |
30 | #include "llvm/IR/LLVMContext.h" |
31 | #include "llvm/IR/Metadata.h" |
32 | #include "llvm/IR/Module.h" |
33 | #include "llvm/IR/Type.h" |
34 | #include "llvm/IR/Value.h" |
35 | #include "llvm/Support/Alignment.h" |
36 | #include "llvm/Support/ErrorHandling.h" |
37 | #include "llvm/Support/FormatVariadic.h" |
38 | |
39 | using namespace clang; |
40 | using namespace CodeGen; |
41 | using namespace clang::hlsl; |
42 | using namespace llvm; |
43 | |
44 | using llvm::hlsl::CBufferRowSizeInBytes; |
45 | |
46 | namespace { |
47 | |
48 | void addDxilValVersion(StringRef ValVersionStr, llvm::Module &M) { |
49 | // The validation of ValVersionStr is done at HLSLToolChain::TranslateArgs. |
50 | // Assume ValVersionStr is legal here. |
51 | VersionTuple Version; |
52 | if (Version.tryParse(string: ValVersionStr) || Version.getBuild() || |
53 | Version.getSubminor() || !Version.getMinor()) { |
54 | return; |
55 | } |
56 | |
57 | uint64_t Major = Version.getMajor(); |
58 | uint64_t Minor = *Version.getMinor(); |
59 | |
60 | auto &Ctx = M.getContext(); |
61 | IRBuilder<> B(M.getContext()); |
62 | MDNode *Val = MDNode::get(Context&: Ctx, MDs: {ConstantAsMetadata::get(C: B.getInt32(C: Major)), |
63 | ConstantAsMetadata::get(C: B.getInt32(C: Minor))}); |
64 | StringRef DXILValKey = "dx.valver" ; |
65 | auto *DXILValMD = M.getOrInsertNamedMetadata(Name: DXILValKey); |
66 | DXILValMD->addOperand(M: Val); |
67 | } |
68 | |
69 | void addRootSignature(llvm::dxbc::RootSignatureVersion RootSigVer, |
70 | ArrayRef<llvm::hlsl::rootsig::RootElement> Elements, |
71 | llvm::Function *Fn, llvm::Module &M) { |
72 | auto &Ctx = M.getContext(); |
73 | |
74 | llvm::hlsl::rootsig::MetadataBuilder RSBuilder(Ctx, Elements); |
75 | MDNode *RootSignature = RSBuilder.BuildRootSignature(); |
76 | |
77 | ConstantAsMetadata *Version = ConstantAsMetadata::get(C: ConstantInt::get( |
78 | Ty: llvm::Type::getInt32Ty(C&: Ctx), V: llvm::to_underlying(E: RootSigVer))); |
79 | MDNode *MDVals = |
80 | MDNode::get(Context&: Ctx, MDs: {ValueAsMetadata::get(V: Fn), RootSignature, Version}); |
81 | |
82 | StringRef RootSignatureValKey = "dx.rootsignatures" ; |
83 | auto *RootSignatureValMD = M.getOrInsertNamedMetadata(Name: RootSignatureValKey); |
84 | RootSignatureValMD->addOperand(M: MDVals); |
85 | } |
86 | |
87 | } // namespace |
88 | |
89 | llvm::Type * |
90 | CGHLSLRuntime::convertHLSLSpecificType(const Type *T, |
91 | SmallVector<int32_t> *Packoffsets) { |
92 | assert(T->isHLSLSpecificType() && "Not an HLSL specific type!" ); |
93 | |
94 | // Check if the target has a specific translation for this type first. |
95 | if (llvm::Type *TargetTy = |
96 | CGM.getTargetCodeGenInfo().getHLSLType(CGM, T, Packoffsets)) |
97 | return TargetTy; |
98 | |
99 | llvm_unreachable("Generic handling of HLSL types is not supported." ); |
100 | } |
101 | |
102 | llvm::Triple::ArchType CGHLSLRuntime::getArch() { |
103 | return CGM.getTarget().getTriple().getArch(); |
104 | } |
105 | |
106 | // Returns true if the type is an HLSL resource class or an array of them |
107 | static bool isResourceRecordTypeOrArrayOf(const clang::Type *Ty) { |
108 | while (const ConstantArrayType *CAT = dyn_cast<ConstantArrayType>(Val: Ty)) |
109 | Ty = CAT->getArrayElementTypeNoTypeQual(); |
110 | return Ty->isHLSLResourceRecord(); |
111 | } |
112 | |
113 | // Emits constant global variables for buffer constants declarations |
114 | // and creates metadata linking the constant globals with the buffer global. |
115 | void CGHLSLRuntime::emitBufferGlobalsAndMetadata(const HLSLBufferDecl *BufDecl, |
116 | llvm::GlobalVariable *BufGV) { |
117 | LLVMContext &Ctx = CGM.getLLVMContext(); |
118 | |
119 | // get the layout struct from constant buffer target type |
120 | llvm::Type *BufType = BufGV->getValueType(); |
121 | llvm::Type *BufLayoutType = |
122 | cast<llvm::TargetExtType>(Val: BufType)->getTypeParameter(i: 0); |
123 | llvm::StructType *LayoutStruct = cast<llvm::StructType>( |
124 | Val: cast<llvm::TargetExtType>(Val: BufLayoutType)->getTypeParameter(i: 0)); |
125 | |
126 | // Start metadata list associating the buffer global variable with its |
127 | // constatns |
128 | SmallVector<llvm::Metadata *> BufGlobals; |
129 | BufGlobals.push_back(Elt: ValueAsMetadata::get(V: BufGV)); |
130 | |
131 | const auto *ElemIt = LayoutStruct->element_begin(); |
132 | for (Decl *D : BufDecl->buffer_decls()) { |
133 | if (isa<CXXRecordDecl, EmptyDecl>(Val: D)) |
134 | // Nothing to do for this declaration. |
135 | continue; |
136 | if (isa<FunctionDecl>(Val: D)) { |
137 | // A function within an cbuffer is effectively a top-level function. |
138 | CGM.EmitTopLevelDecl(D); |
139 | continue; |
140 | } |
141 | VarDecl *VD = dyn_cast<VarDecl>(Val: D); |
142 | if (!VD) |
143 | continue; |
144 | |
145 | QualType VDTy = VD->getType(); |
146 | if (VDTy.getAddressSpace() != LangAS::hlsl_constant) { |
147 | if (VD->getStorageClass() == SC_Static || |
148 | VDTy.getAddressSpace() == LangAS::hlsl_groupshared || |
149 | isResourceRecordTypeOrArrayOf(Ty: VDTy.getTypePtr())) { |
150 | // Emit static and groupshared variables and resource classes inside |
151 | // cbuffer as regular globals |
152 | CGM.EmitGlobal(D: VD); |
153 | } else { |
154 | // Anything else that is not in the hlsl_constant address space must be |
155 | // an empty struct or a zero-sized array and can be ignored |
156 | assert(BufDecl->getASTContext().getTypeSize(VDTy) == 0 && |
157 | "constant buffer decl with non-zero sized type outside of " |
158 | "hlsl_constant address space" ); |
159 | } |
160 | continue; |
161 | } |
162 | |
163 | assert(ElemIt != LayoutStruct->element_end() && |
164 | "number of elements in layout struct does not match" ); |
165 | llvm::Type *LayoutType = *ElemIt++; |
166 | |
167 | // FIXME: handle resources inside user defined structs |
168 | // (llvm/wg-hlsl#175) |
169 | |
170 | // create global variable for the constant and to metadata list |
171 | GlobalVariable *ElemGV = |
172 | cast<GlobalVariable>(Val: CGM.GetAddrOfGlobalVar(D: VD, Ty: LayoutType)); |
173 | BufGlobals.push_back(Elt: ValueAsMetadata::get(V: ElemGV)); |
174 | } |
175 | assert(ElemIt == LayoutStruct->element_end() && |
176 | "number of elements in layout struct does not match" ); |
177 | |
178 | // add buffer metadata to the module |
179 | CGM.getModule() |
180 | .getOrInsertNamedMetadata(Name: "hlsl.cbs" ) |
181 | ->addOperand(M: MDNode::get(Context&: Ctx, MDs: BufGlobals)); |
182 | } |
183 | |
184 | // Creates resource handle type for the HLSL buffer declaration |
185 | static const clang::HLSLAttributedResourceType * |
186 | createBufferHandleType(const HLSLBufferDecl *BufDecl) { |
187 | ASTContext &AST = BufDecl->getASTContext(); |
188 | QualType QT = AST.getHLSLAttributedResourceType( |
189 | Wrapped: AST.HLSLResourceTy, |
190 | Contained: QualType(BufDecl->getLayoutStruct()->getTypeForDecl(), 0), |
191 | Attrs: HLSLAttributedResourceType::Attributes(ResourceClass::CBuffer)); |
192 | return cast<HLSLAttributedResourceType>(Val: QT.getTypePtr()); |
193 | } |
194 | |
195 | // Iterates over all declarations in the HLSL buffer and based on the |
196 | // packoffset or register(c#) annotations it fills outs the Layout |
197 | // vector with the user-specified layout offsets. |
198 | // The buffer offsets can be specified 2 ways: |
199 | // 1. declarations in cbuffer {} block can have a packoffset annotation |
200 | // (translates to HLSLPackOffsetAttr) |
201 | // 2. default constant buffer declarations at global scope can have |
202 | // register(c#) annotations (translates to HLSLResourceBindingAttr with |
203 | // RegisterType::C) |
204 | // It is not guaranteed that all declarations in a buffer have an annotation. |
205 | // For those where it is not specified a -1 value is added to the Layout |
206 | // vector. In the final layout these declarations will be placed at the end |
207 | // of the HLSL buffer after all of the elements with specified offset. |
208 | static void fillPackoffsetLayout(const HLSLBufferDecl *BufDecl, |
209 | SmallVector<int32_t> &Layout) { |
210 | assert(Layout.empty() && "expected empty vector for layout" ); |
211 | assert(BufDecl->hasValidPackoffset()); |
212 | |
213 | for (Decl *D : BufDecl->buffer_decls()) { |
214 | if (isa<CXXRecordDecl, EmptyDecl>(Val: D) || isa<FunctionDecl>(Val: D)) { |
215 | continue; |
216 | } |
217 | VarDecl *VD = dyn_cast<VarDecl>(Val: D); |
218 | if (!VD || VD->getType().getAddressSpace() != LangAS::hlsl_constant) |
219 | continue; |
220 | |
221 | if (!VD->hasAttrs()) { |
222 | Layout.push_back(Elt: -1); |
223 | continue; |
224 | } |
225 | |
226 | int32_t Offset = -1; |
227 | for (auto *Attr : VD->getAttrs()) { |
228 | if (auto *POA = dyn_cast<HLSLPackOffsetAttr>(Val: Attr)) { |
229 | Offset = POA->getOffsetInBytes(); |
230 | break; |
231 | } |
232 | auto *RBA = dyn_cast<HLSLResourceBindingAttr>(Val: Attr); |
233 | if (RBA && |
234 | RBA->getRegisterType() == HLSLResourceBindingAttr::RegisterType::C) { |
235 | Offset = RBA->getSlotNumber() * CBufferRowSizeInBytes; |
236 | break; |
237 | } |
238 | } |
239 | Layout.push_back(Elt: Offset); |
240 | } |
241 | } |
242 | |
243 | // Codegen for HLSLBufferDecl |
244 | void CGHLSLRuntime::addBuffer(const HLSLBufferDecl *BufDecl) { |
245 | |
246 | assert(BufDecl->isCBuffer() && "tbuffer codegen is not supported yet" ); |
247 | |
248 | // create resource handle type for the buffer |
249 | const clang::HLSLAttributedResourceType *ResHandleTy = |
250 | createBufferHandleType(BufDecl); |
251 | |
252 | // empty constant buffer is ignored |
253 | if (ResHandleTy->getContainedType()->getAsCXXRecordDecl()->isEmpty()) |
254 | return; |
255 | |
256 | // create global variable for the constant buffer |
257 | SmallVector<int32_t> Layout; |
258 | if (BufDecl->hasValidPackoffset()) |
259 | fillPackoffsetLayout(BufDecl, Layout); |
260 | |
261 | llvm::TargetExtType *TargetTy = |
262 | cast<llvm::TargetExtType>(Val: convertHLSLSpecificType( |
263 | T: ResHandleTy, Packoffsets: BufDecl->hasValidPackoffset() ? &Layout : nullptr)); |
264 | llvm::GlobalVariable *BufGV = new GlobalVariable( |
265 | TargetTy, /*isConstant*/ false, |
266 | GlobalValue::LinkageTypes::ExternalLinkage, PoisonValue::get(T: TargetTy), |
267 | llvm::formatv(Fmt: "{0}{1}" , Vals: BufDecl->getName(), |
268 | Vals: BufDecl->isCBuffer() ? ".cb" : ".tb" ), |
269 | GlobalValue::NotThreadLocal); |
270 | CGM.getModule().insertGlobalVariable(GV: BufGV); |
271 | |
272 | // Add globals for constant buffer elements and create metadata nodes |
273 | emitBufferGlobalsAndMetadata(BufDecl, BufGV); |
274 | |
275 | // Initialize cbuffer from binding (implicit or explicit) |
276 | HLSLResourceBindingAttr *RBA = BufDecl->getAttr<HLSLResourceBindingAttr>(); |
277 | assert(RBA && |
278 | "cbuffer/tbuffer should always have resource binding attribute" ); |
279 | initializeBufferFromBinding(BufDecl, GV: BufGV, RBA); |
280 | } |
281 | |
282 | llvm::TargetExtType * |
283 | CGHLSLRuntime::getHLSLBufferLayoutType(const RecordType *StructType) { |
284 | const auto Entry = LayoutTypes.find(Val: StructType); |
285 | if (Entry != LayoutTypes.end()) |
286 | return Entry->getSecond(); |
287 | return nullptr; |
288 | } |
289 | |
290 | void CGHLSLRuntime::addHLSLBufferLayoutType(const RecordType *StructType, |
291 | llvm::TargetExtType *LayoutTy) { |
292 | assert(getHLSLBufferLayoutType(StructType) == nullptr && |
293 | "layout type for this struct already exist" ); |
294 | LayoutTypes[StructType] = LayoutTy; |
295 | } |
296 | |
297 | void CGHLSLRuntime::finishCodeGen() { |
298 | auto &TargetOpts = CGM.getTarget().getTargetOpts(); |
299 | auto &CodeGenOpts = CGM.getCodeGenOpts(); |
300 | auto &LangOpts = CGM.getLangOpts(); |
301 | llvm::Module &M = CGM.getModule(); |
302 | Triple T(M.getTargetTriple()); |
303 | if (T.getArch() == Triple::ArchType::dxil) |
304 | addDxilValVersion(ValVersionStr: TargetOpts.DxilValidatorVersion, M); |
305 | if (CodeGenOpts.ResMayAlias) |
306 | M.setModuleFlag(Behavior: llvm::Module::ModFlagBehavior::Error, Key: "dx.resmayalias" , Val: 1); |
307 | |
308 | // NativeHalfType corresponds to the -fnative-half-type clang option which is |
309 | // aliased by clang-dxc's -enable-16bit-types option. This option is used to |
310 | // set the UseNativeLowPrecision DXIL module flag in the DirectX backend |
311 | if (LangOpts.NativeHalfType) |
312 | M.setModuleFlag(Behavior: llvm::Module::ModFlagBehavior::Error, Key: "dx.nativelowprec" , |
313 | Val: 1); |
314 | |
315 | generateGlobalCtorDtorCalls(); |
316 | } |
317 | |
318 | void clang::CodeGen::CGHLSLRuntime::setHLSLEntryAttributes( |
319 | const FunctionDecl *FD, llvm::Function *Fn) { |
320 | const auto *ShaderAttr = FD->getAttr<HLSLShaderAttr>(); |
321 | assert(ShaderAttr && "All entry functions must have a HLSLShaderAttr" ); |
322 | const StringRef ShaderAttrKindStr = "hlsl.shader" ; |
323 | Fn->addFnAttr(Kind: ShaderAttrKindStr, |
324 | Val: llvm::Triple::getEnvironmentTypeName(Kind: ShaderAttr->getType())); |
325 | if (HLSLNumThreadsAttr *NumThreadsAttr = FD->getAttr<HLSLNumThreadsAttr>()) { |
326 | const StringRef NumThreadsKindStr = "hlsl.numthreads" ; |
327 | std::string NumThreadsStr = |
328 | formatv(Fmt: "{0},{1},{2}" , Vals: NumThreadsAttr->getX(), Vals: NumThreadsAttr->getY(), |
329 | Vals: NumThreadsAttr->getZ()); |
330 | Fn->addFnAttr(Kind: NumThreadsKindStr, Val: NumThreadsStr); |
331 | } |
332 | if (HLSLWaveSizeAttr *WaveSizeAttr = FD->getAttr<HLSLWaveSizeAttr>()) { |
333 | const StringRef WaveSizeKindStr = "hlsl.wavesize" ; |
334 | std::string WaveSizeStr = |
335 | formatv(Fmt: "{0},{1},{2}" , Vals: WaveSizeAttr->getMin(), Vals: WaveSizeAttr->getMax(), |
336 | Vals: WaveSizeAttr->getPreferred()); |
337 | Fn->addFnAttr(Kind: WaveSizeKindStr, Val: WaveSizeStr); |
338 | } |
339 | // HLSL entry functions are materialized for module functions with |
340 | // HLSLShaderAttr attribute. SetLLVMFunctionAttributesForDefinition called |
341 | // later in the compiler-flow for such module functions is not aware of and |
342 | // hence not able to set attributes of the newly materialized entry functions. |
343 | // So, set attributes of entry function here, as appropriate. |
344 | if (CGM.getCodeGenOpts().OptimizationLevel == 0) |
345 | Fn->addFnAttr(Kind: llvm::Attribute::OptimizeNone); |
346 | Fn->addFnAttr(Kind: llvm::Attribute::NoInline); |
347 | } |
348 | |
349 | static Value *buildVectorInput(IRBuilder<> &B, Function *F, llvm::Type *Ty) { |
350 | if (const auto *VT = dyn_cast<FixedVectorType>(Val: Ty)) { |
351 | Value *Result = PoisonValue::get(T: Ty); |
352 | for (unsigned I = 0; I < VT->getNumElements(); ++I) { |
353 | Value *Elt = B.CreateCall(Callee: F, Args: {B.getInt32(C: I)}); |
354 | Result = B.CreateInsertElement(Vec: Result, NewElt: Elt, Idx: I); |
355 | } |
356 | return Result; |
357 | } |
358 | return B.CreateCall(Callee: F, Args: {B.getInt32(C: 0)}); |
359 | } |
360 | |
361 | static void addSPIRVBuiltinDecoration(llvm::GlobalVariable *GV, |
362 | unsigned BuiltIn) { |
363 | LLVMContext &Ctx = GV->getContext(); |
364 | IRBuilder<> B(GV->getContext()); |
365 | MDNode *Operands = MDNode::get( |
366 | Context&: Ctx, |
367 | MDs: {ConstantAsMetadata::get(C: B.getInt32(/* Spirv::Decoration::BuiltIn */ C: 11)), |
368 | ConstantAsMetadata::get(C: B.getInt32(C: BuiltIn))}); |
369 | MDNode *Decoration = MDNode::get(Context&: Ctx, MDs: {Operands}); |
370 | GV->addMetadata(Kind: "spirv.Decorations" , MD&: *Decoration); |
371 | } |
372 | |
373 | static llvm::Value *createSPIRVBuiltinLoad(IRBuilder<> &B, llvm::Module &M, |
374 | llvm::Type *Ty, const Twine &Name, |
375 | unsigned BuiltInID) { |
376 | auto *GV = new llvm::GlobalVariable( |
377 | M, Ty, /* isConstant= */ true, llvm::GlobalValue::ExternalLinkage, |
378 | /* Initializer= */ nullptr, Name, /* insertBefore= */ nullptr, |
379 | llvm::GlobalVariable::GeneralDynamicTLSModel, |
380 | /* AddressSpace */ 7, /* isExternallyInitialized= */ true); |
381 | addSPIRVBuiltinDecoration(GV, BuiltIn: BuiltInID); |
382 | GV->setVisibility(llvm::GlobalValue::HiddenVisibility); |
383 | return B.CreateLoad(Ty, Ptr: GV); |
384 | } |
385 | |
386 | llvm::Value *CGHLSLRuntime::emitInputSemantic(IRBuilder<> &B, |
387 | const ParmVarDecl &D, |
388 | llvm::Type *Ty) { |
389 | assert(D.hasAttrs() && "Entry parameter missing annotation attribute!" ); |
390 | if (D.hasAttr<HLSLSV_GroupIndexAttr>()) { |
391 | llvm::Function *GroupIndex = |
392 | CGM.getIntrinsic(IID: getFlattenedThreadIdInGroupIntrinsic()); |
393 | return B.CreateCall(Callee: FunctionCallee(GroupIndex)); |
394 | } |
395 | if (D.hasAttr<HLSLSV_DispatchThreadIDAttr>()) { |
396 | llvm::Function *ThreadIDIntrinsic = |
397 | CGM.getIntrinsic(IID: getThreadIdIntrinsic()); |
398 | return buildVectorInput(B, F: ThreadIDIntrinsic, Ty); |
399 | } |
400 | if (D.hasAttr<HLSLSV_GroupThreadIDAttr>()) { |
401 | llvm::Function *GroupThreadIDIntrinsic = |
402 | CGM.getIntrinsic(IID: getGroupThreadIdIntrinsic()); |
403 | return buildVectorInput(B, F: GroupThreadIDIntrinsic, Ty); |
404 | } |
405 | if (D.hasAttr<HLSLSV_GroupIDAttr>()) { |
406 | llvm::Function *GroupIDIntrinsic = CGM.getIntrinsic(IID: getGroupIdIntrinsic()); |
407 | return buildVectorInput(B, F: GroupIDIntrinsic, Ty); |
408 | } |
409 | if (D.hasAttr<HLSLSV_PositionAttr>()) { |
410 | if (getArch() == llvm::Triple::spirv) |
411 | return createSPIRVBuiltinLoad(B, M&: CGM.getModule(), Ty, Name: "sv_position" , |
412 | /* BuiltIn::Position */ BuiltInID: 0); |
413 | llvm_unreachable("SV_Position semantic not implemented for this target." ); |
414 | } |
415 | assert(false && "Unhandled parameter attribute" ); |
416 | return nullptr; |
417 | } |
418 | |
419 | void CGHLSLRuntime::emitEntryFunction(const FunctionDecl *FD, |
420 | llvm::Function *Fn) { |
421 | llvm::Module &M = CGM.getModule(); |
422 | llvm::LLVMContext &Ctx = M.getContext(); |
423 | auto *EntryTy = llvm::FunctionType::get(Result: llvm::Type::getVoidTy(C&: Ctx), isVarArg: false); |
424 | Function *EntryFn = |
425 | Function::Create(Ty: EntryTy, Linkage: Function::ExternalLinkage, N: FD->getName(), M: &M); |
426 | |
427 | // Copy function attributes over, we have no argument or return attributes |
428 | // that can be valid on the real entry. |
429 | AttributeList NewAttrs = AttributeList::get(C&: Ctx, Index: AttributeList::FunctionIndex, |
430 | Attrs: Fn->getAttributes().getFnAttrs()); |
431 | EntryFn->setAttributes(NewAttrs); |
432 | setHLSLEntryAttributes(FD, Fn: EntryFn); |
433 | |
434 | // Set the called function as internal linkage. |
435 | Fn->setLinkage(GlobalValue::InternalLinkage); |
436 | |
437 | BasicBlock *BB = BasicBlock::Create(Context&: Ctx, Name: "entry" , Parent: EntryFn); |
438 | IRBuilder<> B(BB); |
439 | llvm::SmallVector<Value *> Args; |
440 | |
441 | SmallVector<OperandBundleDef, 1> OB; |
442 | if (CGM.shouldEmitConvergenceTokens()) { |
443 | assert(EntryFn->isConvergent()); |
444 | llvm::Value *I = |
445 | B.CreateIntrinsic(ID: llvm::Intrinsic::experimental_convergence_entry, Args: {}); |
446 | llvm::Value *bundleArgs[] = {I}; |
447 | OB.emplace_back(Args: "convergencectrl" , Args&: bundleArgs); |
448 | } |
449 | |
450 | // FIXME: support struct parameters where semantics are on members. |
451 | // See: https://github.com/llvm/llvm-project/issues/57874 |
452 | unsigned SRetOffset = 0; |
453 | for (const auto &Param : Fn->args()) { |
454 | if (Param.hasStructRetAttr()) { |
455 | // FIXME: support output. |
456 | // See: https://github.com/llvm/llvm-project/issues/57874 |
457 | SRetOffset = 1; |
458 | Args.emplace_back(Args: PoisonValue::get(T: Param.getType())); |
459 | continue; |
460 | } |
461 | const ParmVarDecl *PD = FD->getParamDecl(i: Param.getArgNo() - SRetOffset); |
462 | Args.push_back(Elt: emitInputSemantic(B, D: *PD, Ty: Param.getType())); |
463 | } |
464 | |
465 | CallInst *CI = B.CreateCall(Callee: FunctionCallee(Fn), Args, OpBundles: OB); |
466 | CI->setCallingConv(Fn->getCallingConv()); |
467 | // FIXME: Handle codegen for return type semantics. |
468 | // See: https://github.com/llvm/llvm-project/issues/57875 |
469 | B.CreateRetVoid(); |
470 | |
471 | // Add and identify root signature to function, if applicable |
472 | for (const Attr *Attr : FD->getAttrs()) { |
473 | if (const auto *RSAttr = dyn_cast<RootSignatureAttr>(Val: Attr)) { |
474 | auto *RSDecl = RSAttr->getSignatureDecl(); |
475 | addRootSignature(RootSigVer: RSDecl->getVersion(), Elements: RSDecl->getRootElements(), Fn: EntryFn, |
476 | M); |
477 | } |
478 | } |
479 | } |
480 | |
481 | static void gatherFunctions(SmallVectorImpl<Function *> &Fns, llvm::Module &M, |
482 | bool CtorOrDtor) { |
483 | const auto *GV = |
484 | M.getNamedGlobal(Name: CtorOrDtor ? "llvm.global_ctors" : "llvm.global_dtors" ); |
485 | if (!GV) |
486 | return; |
487 | const auto *CA = dyn_cast<ConstantArray>(Val: GV->getInitializer()); |
488 | if (!CA) |
489 | return; |
490 | // The global_ctor array elements are a struct [Priority, Fn *, COMDat]. |
491 | // HLSL neither supports priorities or COMDat values, so we will check those |
492 | // in an assert but not handle them. |
493 | |
494 | for (const auto &Ctor : CA->operands()) { |
495 | if (isa<ConstantAggregateZero>(Val: Ctor)) |
496 | continue; |
497 | ConstantStruct *CS = cast<ConstantStruct>(Val: Ctor); |
498 | |
499 | assert(cast<ConstantInt>(CS->getOperand(0))->getValue() == 65535 && |
500 | "HLSL doesn't support setting priority for global ctors." ); |
501 | assert(isa<ConstantPointerNull>(CS->getOperand(2)) && |
502 | "HLSL doesn't support COMDat for global ctors." ); |
503 | Fns.push_back(Elt: cast<Function>(Val: CS->getOperand(i_nocapture: 1))); |
504 | } |
505 | } |
506 | |
507 | void CGHLSLRuntime::generateGlobalCtorDtorCalls() { |
508 | llvm::Module &M = CGM.getModule(); |
509 | SmallVector<Function *> CtorFns; |
510 | SmallVector<Function *> DtorFns; |
511 | gatherFunctions(Fns&: CtorFns, M, CtorOrDtor: true); |
512 | gatherFunctions(Fns&: DtorFns, M, CtorOrDtor: false); |
513 | |
514 | // Insert a call to the global constructor at the beginning of the entry block |
515 | // to externally exported functions. This is a bit of a hack, but HLSL allows |
516 | // global constructors, but doesn't support driver initialization of globals. |
517 | for (auto &F : M.functions()) { |
518 | if (!F.hasFnAttribute(Kind: "hlsl.shader" )) |
519 | continue; |
520 | auto *Token = getConvergenceToken(BB&: F.getEntryBlock()); |
521 | Instruction *IP = &*F.getEntryBlock().begin(); |
522 | SmallVector<OperandBundleDef, 1> OB; |
523 | if (Token) { |
524 | llvm::Value *bundleArgs[] = {Token}; |
525 | OB.emplace_back(Args: "convergencectrl" , Args&: bundleArgs); |
526 | IP = Token->getNextNode(); |
527 | } |
528 | IRBuilder<> B(IP); |
529 | for (auto *Fn : CtorFns) { |
530 | auto CI = B.CreateCall(Callee: FunctionCallee(Fn), Args: {}, OpBundles: OB); |
531 | CI->setCallingConv(Fn->getCallingConv()); |
532 | } |
533 | |
534 | // Insert global dtors before the terminator of the last instruction |
535 | B.SetInsertPoint(F.back().getTerminator()); |
536 | for (auto *Fn : DtorFns) { |
537 | auto CI = B.CreateCall(Callee: FunctionCallee(Fn), Args: {}, OpBundles: OB); |
538 | CI->setCallingConv(Fn->getCallingConv()); |
539 | } |
540 | } |
541 | |
542 | // No need to keep global ctors/dtors for non-lib profile after call to |
543 | // ctors/dtors added for entry. |
544 | Triple T(M.getTargetTriple()); |
545 | if (T.getEnvironment() != Triple::EnvironmentType::Library) { |
546 | if (auto *GV = M.getNamedGlobal(Name: "llvm.global_ctors" )) |
547 | GV->eraseFromParent(); |
548 | if (auto *GV = M.getNamedGlobal(Name: "llvm.global_dtors" )) |
549 | GV->eraseFromParent(); |
550 | } |
551 | } |
552 | |
553 | static void initializeBuffer(CodeGenModule &CGM, llvm::GlobalVariable *GV, |
554 | Intrinsic::ID IntrID, |
555 | ArrayRef<llvm::Value *> Args) { |
556 | |
557 | LLVMContext &Ctx = CGM.getLLVMContext(); |
558 | llvm::Function *InitResFunc = llvm::Function::Create( |
559 | Ty: llvm::FunctionType::get(Result: CGM.VoidTy, isVarArg: false), |
560 | Linkage: llvm::GlobalValue::InternalLinkage, |
561 | N: ("_init_buffer_" + GV->getName()).str(), M&: CGM.getModule()); |
562 | InitResFunc->addFnAttr(Kind: llvm::Attribute::AlwaysInline); |
563 | |
564 | llvm::BasicBlock *EntryBB = |
565 | llvm::BasicBlock::Create(Context&: Ctx, Name: "entry" , Parent: InitResFunc); |
566 | CGBuilderTy Builder(CGM, Ctx); |
567 | const DataLayout &DL = CGM.getModule().getDataLayout(); |
568 | Builder.SetInsertPoint(EntryBB); |
569 | |
570 | // Make sure the global variable is buffer resource handle |
571 | llvm::Type *HandleTy = GV->getValueType(); |
572 | assert(HandleTy->isTargetExtTy() && "unexpected type of the buffer global" ); |
573 | |
574 | llvm::Value *CreateHandle = Builder.CreateIntrinsic( |
575 | /*ReturnType=*/RetTy: HandleTy, ID: IntrID, Args, FMFSource: nullptr, |
576 | Name: Twine(GV->getName()).concat(Suffix: "_h" )); |
577 | |
578 | llvm::Value *HandleRef = Builder.CreateStructGEP(Ty: GV->getValueType(), Ptr: GV, Idx: 0); |
579 | Builder.CreateAlignedStore(Val: CreateHandle, Ptr: HandleRef, |
580 | Align: HandleRef->getPointerAlignment(DL)); |
581 | Builder.CreateRetVoid(); |
582 | |
583 | CGM.AddCXXGlobalInit(F: InitResFunc); |
584 | } |
585 | |
586 | void CGHLSLRuntime::initializeBufferFromBinding(const HLSLBufferDecl *BufDecl, |
587 | llvm::GlobalVariable *GV, |
588 | HLSLResourceBindingAttr *RBA) { |
589 | assert(RBA && "expect a nonnull binding attribute" ); |
590 | llvm::Type *Int1Ty = llvm::Type::getInt1Ty(C&: CGM.getLLVMContext()); |
591 | auto *NonUniform = llvm::ConstantInt::get(Ty: Int1Ty, V: false); |
592 | auto *Index = llvm::ConstantInt::get(Ty: CGM.IntTy, V: 0); |
593 | auto *RangeSize = llvm::ConstantInt::get(Ty: CGM.IntTy, V: 1); |
594 | auto *Space = llvm::ConstantInt::get(Ty: CGM.IntTy, V: RBA->getSpaceNumber()); |
595 | Value *Name = nullptr; |
596 | |
597 | llvm::Intrinsic::ID IntrinsicID = |
598 | RBA->hasRegisterSlot() |
599 | ? CGM.getHLSLRuntime().getCreateHandleFromBindingIntrinsic() |
600 | : CGM.getHLSLRuntime().getCreateHandleFromImplicitBindingIntrinsic(); |
601 | |
602 | std::string Str(BufDecl->getName()); |
603 | std::string GlobalName(Str + ".str" ); |
604 | Name = CGM.GetAddrOfConstantCString(Str, GlobalName: GlobalName.c_str()).getPointer(); |
605 | |
606 | // buffer with explicit binding |
607 | if (RBA->hasRegisterSlot()) { |
608 | auto *RegSlot = llvm::ConstantInt::get(Ty: CGM.IntTy, V: RBA->getSlotNumber()); |
609 | SmallVector<Value *> Args{Space, RegSlot, RangeSize, |
610 | Index, NonUniform, Name}; |
611 | initializeBuffer(CGM, GV, IntrID: IntrinsicID, Args); |
612 | } else { |
613 | // buffer with implicit binding |
614 | auto *OrderID = |
615 | llvm::ConstantInt::get(Ty: CGM.IntTy, V: RBA->getImplicitBindingOrderID()); |
616 | SmallVector<Value *> Args{OrderID, Space, RangeSize, |
617 | Index, NonUniform, Name}; |
618 | initializeBuffer(CGM, GV, IntrID: IntrinsicID, Args); |
619 | } |
620 | } |
621 | |
622 | void CGHLSLRuntime::handleGlobalVarDefinition(const VarDecl *VD, |
623 | llvm::GlobalVariable *GV) { |
624 | if (auto Attr = VD->getAttr<HLSLVkExtBuiltinInputAttr>()) |
625 | addSPIRVBuiltinDecoration(GV, BuiltIn: Attr->getBuiltIn()); |
626 | } |
627 | |
628 | llvm::Instruction *CGHLSLRuntime::getConvergenceToken(BasicBlock &BB) { |
629 | if (!CGM.shouldEmitConvergenceTokens()) |
630 | return nullptr; |
631 | |
632 | auto E = BB.end(); |
633 | for (auto I = BB.begin(); I != E; ++I) { |
634 | auto *II = dyn_cast<llvm::IntrinsicInst>(Val: &*I); |
635 | if (II && llvm::isConvergenceControlIntrinsic(IntrinsicID: II->getIntrinsicID())) { |
636 | return II; |
637 | } |
638 | } |
639 | llvm_unreachable("Convergence token should have been emitted." ); |
640 | return nullptr; |
641 | } |
642 | |
643 | class OpaqueValueVisitor : public RecursiveASTVisitor<OpaqueValueVisitor> { |
644 | public: |
645 | llvm::SmallPtrSet<OpaqueValueExpr *, 8> OVEs; |
646 | OpaqueValueVisitor() {} |
647 | |
648 | bool VisitOpaqueValueExpr(OpaqueValueExpr *E) { |
649 | OVEs.insert(Ptr: E); |
650 | return true; |
651 | } |
652 | }; |
653 | |
654 | void CGHLSLRuntime::emitInitListOpaqueValues(CodeGenFunction &CGF, |
655 | InitListExpr *E) { |
656 | |
657 | typedef CodeGenFunction::OpaqueValueMappingData OpaqueValueMappingData; |
658 | OpaqueValueVisitor Visitor; |
659 | Visitor.TraverseStmt(S: E); |
660 | for (auto *OVE : Visitor.OVEs) { |
661 | if (CGF.isOpaqueValueEmitted(E: OVE)) |
662 | continue; |
663 | if (OpaqueValueMappingData::shouldBindAsLValue(expr: OVE)) { |
664 | LValue LV = CGF.EmitLValue(E: OVE->getSourceExpr()); |
665 | OpaqueValueMappingData::bind(CGF, ov: OVE, lv: LV); |
666 | } else { |
667 | RValue RV = CGF.EmitAnyExpr(E: OVE->getSourceExpr()); |
668 | OpaqueValueMappingData::bind(CGF, ov: OVE, rv: RV); |
669 | } |
670 | } |
671 | } |
672 | |