| 1 | //===--- ObjectFilePCHContainerWriter.cpp -----------------------------===// |
| 2 | // |
| 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| 4 | // See https://llvm.org/LICENSE.txt for license information. |
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
| 6 | // |
| 7 | //===----------------------------------------------------------------------===// |
| 8 | |
| 9 | #include "clang/CodeGen/ObjectFilePCHContainerWriter.h" |
| 10 | #include "CGDebugInfo.h" |
| 11 | #include "CodeGenModule.h" |
| 12 | #include "clang/AST/ASTContext.h" |
| 13 | #include "clang/AST/DeclObjC.h" |
| 14 | #include "clang/AST/Expr.h" |
| 15 | #include "clang/AST/RecursiveASTVisitor.h" |
| 16 | #include "clang/Basic/CodeGenOptions.h" |
| 17 | #include "clang/Basic/Diagnostic.h" |
| 18 | #include "clang/Basic/TargetInfo.h" |
| 19 | #include "clang/CodeGen/BackendUtil.h" |
| 20 | #include "clang/Frontend/CompilerInstance.h" |
| 21 | #include "clang/Lex/HeaderSearch.h" |
| 22 | #include "clang/Lex/Preprocessor.h" |
| 23 | #include "llvm/ADT/StringRef.h" |
| 24 | #include "llvm/IR/Constants.h" |
| 25 | #include "llvm/IR/DataLayout.h" |
| 26 | #include "llvm/IR/LLVMContext.h" |
| 27 | #include "llvm/IR/Module.h" |
| 28 | #include "llvm/MC/TargetRegistry.h" |
| 29 | #include "llvm/Object/COFF.h" |
| 30 | #include "llvm/Support/Path.h" |
| 31 | #include <memory> |
| 32 | #include <utility> |
| 33 | |
| 34 | using namespace clang; |
| 35 | |
| 36 | #define DEBUG_TYPE "pchcontainer" |
| 37 | |
| 38 | namespace { |
| 39 | class PCHContainerGenerator : public ASTConsumer { |
| 40 | CompilerInstance &CI; |
| 41 | DiagnosticsEngine &Diags; |
| 42 | const std::string MainFileName; |
| 43 | const std::string OutputFileName; |
| 44 | ASTContext *Ctx; |
| 45 | ModuleMap &MMap; |
| 46 | IntrusiveRefCntPtr<llvm::vfs::FileSystem> FS; |
| 47 | const HeaderSearchOptions &; |
| 48 | const PreprocessorOptions &PreprocessorOpts; |
| 49 | CodeGenOptions CodeGenOpts; |
| 50 | const TargetOptions TargetOpts; |
| 51 | LangOptions LangOpts; |
| 52 | std::unique_ptr<llvm::LLVMContext> VMContext; |
| 53 | std::unique_ptr<llvm::Module> M; |
| 54 | std::unique_ptr<CodeGen::CodeGenModule> Builder; |
| 55 | std::unique_ptr<raw_pwrite_stream> OS; |
| 56 | std::shared_ptr<PCHBuffer> Buffer; |
| 57 | |
| 58 | /// Visit every type and emit debug info for it. |
| 59 | struct DebugTypeVisitor : public RecursiveASTVisitor<DebugTypeVisitor> { |
| 60 | clang::CodeGen::CGDebugInfo &DI; |
| 61 | ASTContext &Ctx; |
| 62 | DebugTypeVisitor(clang::CodeGen::CGDebugInfo &DI, ASTContext &Ctx) |
| 63 | : DI(DI), Ctx(Ctx) {} |
| 64 | |
| 65 | /// Determine whether this type can be represented in DWARF. |
| 66 | static bool CanRepresent(const Type *Ty) { |
| 67 | return !Ty->isDependentType() && !Ty->isUndeducedType(); |
| 68 | } |
| 69 | |
| 70 | bool VisitImportDecl(ImportDecl *D) { |
| 71 | if (!D->getImportedOwningModule()) |
| 72 | DI.EmitImportDecl(ID: *D); |
| 73 | return true; |
| 74 | } |
| 75 | |
| 76 | bool VisitTypeDecl(TypeDecl *D) { |
| 77 | // TagDecls may be deferred until after all decls have been merged and we |
| 78 | // know the complete type. Pure forward declarations will be skipped, but |
| 79 | // they don't need to be emitted into the module anyway. |
| 80 | if (auto *TD = dyn_cast<TagDecl>(Val: D)) |
| 81 | if (!TD->isCompleteDefinition()) |
| 82 | return true; |
| 83 | |
| 84 | if (D->hasAttr<NoDebugAttr>()) |
| 85 | return true; |
| 86 | |
| 87 | QualType QualTy = Ctx.getTypeDeclType(Decl: D); |
| 88 | if (!QualTy.isNull() && CanRepresent(Ty: QualTy.getTypePtr())) |
| 89 | DI.getOrCreateStandaloneType(Ty: QualTy, Loc: D->getLocation()); |
| 90 | return true; |
| 91 | } |
| 92 | |
| 93 | bool VisitObjCInterfaceDecl(ObjCInterfaceDecl *D) { |
| 94 | QualType QualTy(D->getTypeForDecl(), 0); |
| 95 | if (!QualTy.isNull() && CanRepresent(Ty: QualTy.getTypePtr())) |
| 96 | DI.getOrCreateStandaloneType(Ty: QualTy, Loc: D->getLocation()); |
| 97 | return true; |
| 98 | } |
| 99 | |
| 100 | bool VisitFunctionDecl(FunctionDecl *D) { |
| 101 | // Skip deduction guides. |
| 102 | if (isa<CXXDeductionGuideDecl>(Val: D)) |
| 103 | return true; |
| 104 | |
| 105 | if (isa<CXXMethodDecl>(Val: D)) |
| 106 | // This is not yet supported. Constructing the `this' argument |
| 107 | // mandates a CodeGenFunction. |
| 108 | return true; |
| 109 | |
| 110 | SmallVector<QualType, 16> ArgTypes; |
| 111 | for (auto *i : D->parameters()) |
| 112 | ArgTypes.push_back(Elt: i->getType()); |
| 113 | QualType RetTy = D->getReturnType(); |
| 114 | QualType FnTy = Ctx.getFunctionType(ResultTy: RetTy, Args: ArgTypes, |
| 115 | EPI: FunctionProtoType::ExtProtoInfo()); |
| 116 | if (CanRepresent(Ty: FnTy.getTypePtr())) |
| 117 | DI.EmitFunctionDecl(GD: D, Loc: D->getLocation(), FnType: FnTy); |
| 118 | return true; |
| 119 | } |
| 120 | |
| 121 | bool VisitObjCMethodDecl(ObjCMethodDecl *D) { |
| 122 | if (!D->getClassInterface()) |
| 123 | return true; |
| 124 | |
| 125 | bool selfIsPseudoStrong, selfIsConsumed; |
| 126 | SmallVector<QualType, 16> ArgTypes; |
| 127 | ArgTypes.push_back(Elt: D->getSelfType(Context&: Ctx, OID: D->getClassInterface(), |
| 128 | selfIsPseudoStrong, selfIsConsumed)); |
| 129 | ArgTypes.push_back(Elt: Ctx.getObjCSelType()); |
| 130 | for (auto *i : D->parameters()) |
| 131 | ArgTypes.push_back(Elt: i->getType()); |
| 132 | QualType RetTy = D->getReturnType(); |
| 133 | QualType FnTy = Ctx.getFunctionType(ResultTy: RetTy, Args: ArgTypes, |
| 134 | EPI: FunctionProtoType::ExtProtoInfo()); |
| 135 | if (CanRepresent(Ty: FnTy.getTypePtr())) |
| 136 | DI.EmitFunctionDecl(GD: D, Loc: D->getLocation(), FnType: FnTy); |
| 137 | return true; |
| 138 | } |
| 139 | }; |
| 140 | |
| 141 | public: |
| 142 | PCHContainerGenerator(CompilerInstance &CI, const std::string &MainFileName, |
| 143 | const std::string &OutputFileName, |
| 144 | std::unique_ptr<raw_pwrite_stream> OS, |
| 145 | std::shared_ptr<PCHBuffer> Buffer) |
| 146 | : CI(CI), Diags(CI.getDiagnostics()), MainFileName(MainFileName), |
| 147 | OutputFileName(OutputFileName), Ctx(nullptr), |
| 148 | MMap(CI.getPreprocessor().getHeaderSearchInfo().getModuleMap()), |
| 149 | FS(&CI.getVirtualFileSystem()), |
| 150 | HeaderSearchOpts(CI.getHeaderSearchOpts()), |
| 151 | PreprocessorOpts(CI.getPreprocessorOpts()), |
| 152 | TargetOpts(CI.getTargetOpts()), LangOpts(CI.getLangOpts()), |
| 153 | OS(std::move(OS)), Buffer(std::move(Buffer)) { |
| 154 | // The debug info output isn't affected by CodeModel and |
| 155 | // ThreadModel, but the backend expects them to be nonempty. |
| 156 | CodeGenOpts.CodeModel = "default" ; |
| 157 | LangOpts.setThreadModel(LangOptions::ThreadModelKind::Single); |
| 158 | CodeGenOpts.DebugTypeExtRefs = true; |
| 159 | // When building a module MainFileName is the name of the modulemap file. |
| 160 | CodeGenOpts.MainFileName = |
| 161 | LangOpts.CurrentModule.empty() ? MainFileName : LangOpts.CurrentModule; |
| 162 | CodeGenOpts.setDebugInfo(llvm::codegenoptions::FullDebugInfo); |
| 163 | CodeGenOpts.setDebuggerTuning(CI.getCodeGenOpts().getDebuggerTuning()); |
| 164 | CodeGenOpts.DwarfVersion = CI.getCodeGenOpts().DwarfVersion; |
| 165 | CodeGenOpts.DebugCompilationDir = |
| 166 | CI.getInvocation().getCodeGenOpts().DebugCompilationDir; |
| 167 | CodeGenOpts.DebugPrefixMap = |
| 168 | CI.getInvocation().getCodeGenOpts().DebugPrefixMap; |
| 169 | CodeGenOpts.DebugStrictDwarf = CI.getCodeGenOpts().DebugStrictDwarf; |
| 170 | } |
| 171 | |
| 172 | ~PCHContainerGenerator() override = default; |
| 173 | |
| 174 | void Initialize(ASTContext &Context) override { |
| 175 | assert(!Ctx && "initialized multiple times" ); |
| 176 | |
| 177 | Ctx = &Context; |
| 178 | VMContext.reset(p: new llvm::LLVMContext()); |
| 179 | M.reset(p: new llvm::Module(MainFileName, *VMContext)); |
| 180 | M->setDataLayout(Ctx->getTargetInfo().getDataLayoutString()); |
| 181 | Builder.reset(p: new CodeGen::CodeGenModule( |
| 182 | *Ctx, FS, HeaderSearchOpts, PreprocessorOpts, CodeGenOpts, *M, Diags)); |
| 183 | |
| 184 | // Prepare CGDebugInfo to emit debug info for a clang module. |
| 185 | auto *DI = Builder->getModuleDebugInfo(); |
| 186 | StringRef ModuleName = llvm::sys::path::filename(path: MainFileName); |
| 187 | DI->setPCHDescriptor( |
| 188 | {ModuleName, "" , OutputFileName, ASTFileSignature::createDISentinel()}); |
| 189 | DI->setModuleMap(MMap); |
| 190 | } |
| 191 | |
| 192 | bool HandleTopLevelDecl(DeclGroupRef D) override { |
| 193 | if (Diags.hasErrorOccurred()) |
| 194 | return true; |
| 195 | |
| 196 | // Collect debug info for all decls in this group. |
| 197 | for (auto *I : D) |
| 198 | if (!I->isFromASTFile()) { |
| 199 | DebugTypeVisitor DTV(*Builder->getModuleDebugInfo(), *Ctx); |
| 200 | DTV.TraverseDecl(D: I); |
| 201 | } |
| 202 | return true; |
| 203 | } |
| 204 | |
| 205 | void HandleTopLevelDeclInObjCContainer(DeclGroupRef D) override { |
| 206 | HandleTopLevelDecl(D); |
| 207 | } |
| 208 | |
| 209 | void HandleTagDeclDefinition(TagDecl *D) override { |
| 210 | if (Diags.hasErrorOccurred()) |
| 211 | return; |
| 212 | |
| 213 | if (D->isFromASTFile()) |
| 214 | return; |
| 215 | |
| 216 | // Anonymous tag decls are deferred until we are building their declcontext. |
| 217 | if (D->getName().empty()) |
| 218 | return; |
| 219 | |
| 220 | // Defer tag decls until their declcontext is complete. |
| 221 | auto *DeclCtx = D->getDeclContext(); |
| 222 | while (DeclCtx) { |
| 223 | if (auto *D = dyn_cast<TagDecl>(Val: DeclCtx)) |
| 224 | if (!D->isCompleteDefinition()) |
| 225 | return; |
| 226 | DeclCtx = DeclCtx->getParent(); |
| 227 | } |
| 228 | |
| 229 | DebugTypeVisitor DTV(*Builder->getModuleDebugInfo(), *Ctx); |
| 230 | DTV.TraverseDecl(D); |
| 231 | Builder->UpdateCompletedType(TD: D); |
| 232 | } |
| 233 | |
| 234 | void HandleTagDeclRequiredDefinition(const TagDecl *D) override { |
| 235 | if (Diags.hasErrorOccurred()) |
| 236 | return; |
| 237 | |
| 238 | if (const RecordDecl *RD = dyn_cast<RecordDecl>(Val: D)) |
| 239 | Builder->getModuleDebugInfo()->completeRequiredType(RD); |
| 240 | } |
| 241 | |
| 242 | void HandleImplicitImportDecl(ImportDecl *D) override { |
| 243 | if (!D->getImportedOwningModule()) |
| 244 | Builder->getModuleDebugInfo()->EmitImportDecl(ID: *D); |
| 245 | } |
| 246 | |
| 247 | /// Emit a container holding the serialized AST. |
| 248 | void HandleTranslationUnit(ASTContext &Ctx) override { |
| 249 | assert(M && VMContext && Builder); |
| 250 | // Delete these on function exit. |
| 251 | std::unique_ptr<llvm::LLVMContext> VMContext = std::move(this->VMContext); |
| 252 | std::unique_ptr<llvm::Module> M = std::move(this->M); |
| 253 | std::unique_ptr<CodeGen::CodeGenModule> Builder = std::move(this->Builder); |
| 254 | |
| 255 | if (Diags.hasErrorOccurred()) |
| 256 | return; |
| 257 | |
| 258 | M->setTargetTriple(Ctx.getTargetInfo().getTriple()); |
| 259 | M->setDataLayout(Ctx.getTargetInfo().getDataLayoutString()); |
| 260 | |
| 261 | // PCH files don't have a signature field in the control block, |
| 262 | // but LLVM detects DWO CUs by looking for a non-zero DWO id. |
| 263 | // We use the lower 64 bits for debug info. |
| 264 | |
| 265 | uint64_t Signature = |
| 266 | Buffer->Signature ? Buffer->Signature.truncatedValue() : ~1ULL; |
| 267 | |
| 268 | Builder->getModuleDebugInfo()->setDwoId(Signature); |
| 269 | |
| 270 | // Finalize the Builder. |
| 271 | if (Builder) |
| 272 | Builder->Release(); |
| 273 | |
| 274 | // Ensure the target exists. |
| 275 | std::string Error; |
| 276 | auto Triple = Ctx.getTargetInfo().getTriple(); |
| 277 | if (!llvm::TargetRegistry::lookupTarget(TheTriple: Triple, Error)) |
| 278 | llvm::report_fatal_error(reason: llvm::Twine(Error)); |
| 279 | |
| 280 | // Emit the serialized Clang AST into its own section. |
| 281 | assert(Buffer->IsComplete && "serialization did not complete" ); |
| 282 | auto &SerializedAST = Buffer->Data; |
| 283 | auto Size = SerializedAST.size(); |
| 284 | |
| 285 | if (Triple.isOSBinFormatWasm()) { |
| 286 | // Emit __clangast in custom section instead of named data segment |
| 287 | // to find it while iterating sections. |
| 288 | // This could be avoided if all data segements (the wasm sense) were |
| 289 | // represented as their own sections (in the llvm sense). |
| 290 | // TODO: https://github.com/WebAssembly/tool-conventions/issues/138 |
| 291 | llvm::NamedMDNode *MD = |
| 292 | M->getOrInsertNamedMetadata(Name: "wasm.custom_sections" ); |
| 293 | llvm::Metadata *Ops[2] = { |
| 294 | llvm::MDString::get(Context&: *VMContext, Str: "__clangast" ), |
| 295 | llvm::MDString::get(Context&: *VMContext, |
| 296 | Str: StringRef(SerializedAST.data(), Size))}; |
| 297 | auto *NameAndContent = llvm::MDTuple::get(Context&: *VMContext, MDs: Ops); |
| 298 | MD->addOperand(M: NameAndContent); |
| 299 | } else { |
| 300 | auto Int8Ty = llvm::Type::getInt8Ty(C&: *VMContext); |
| 301 | auto *Ty = llvm::ArrayType::get(ElementType: Int8Ty, NumElements: Size); |
| 302 | auto *Data = llvm::ConstantDataArray::getString( |
| 303 | Context&: *VMContext, Initializer: StringRef(SerializedAST.data(), Size), |
| 304 | /*AddNull=*/false); |
| 305 | auto *ASTSym = new llvm::GlobalVariable( |
| 306 | *M, Ty, /*constant*/ true, llvm::GlobalVariable::InternalLinkage, |
| 307 | Data, "__clang_ast" ); |
| 308 | // The on-disk hashtable needs to be aligned. |
| 309 | ASTSym->setAlignment(llvm::Align(8)); |
| 310 | |
| 311 | // Mach-O also needs a segment name. |
| 312 | if (Triple.isOSBinFormatMachO()) |
| 313 | ASTSym->setSection("__CLANG,__clangast" ); |
| 314 | // COFF has an eight character length limit. |
| 315 | else if (Triple.isOSBinFormatCOFF()) |
| 316 | ASTSym->setSection("clangast" ); |
| 317 | else |
| 318 | ASTSym->setSection("__clangast" ); |
| 319 | } |
| 320 | |
| 321 | LLVM_DEBUG({ |
| 322 | // Print the IR for the PCH container to the debug output. |
| 323 | llvm::SmallString<0> Buffer; |
| 324 | clang::emitBackendOutput( |
| 325 | CI, CodeGenOpts, Ctx.getTargetInfo().getDataLayoutString(), M.get(), |
| 326 | BackendAction::Backend_EmitLL, FS, |
| 327 | std::make_unique<llvm::raw_svector_ostream>(Buffer)); |
| 328 | llvm::dbgs() << Buffer; |
| 329 | }); |
| 330 | |
| 331 | // Use the LLVM backend to emit the pch container. |
| 332 | clang::emitBackendOutput(CI, CGOpts&: CodeGenOpts, |
| 333 | TDesc: Ctx.getTargetInfo().getDataLayoutString(), M: M.get(), |
| 334 | Action: BackendAction::Backend_EmitObj, VFS: FS, OS: std::move(OS)); |
| 335 | |
| 336 | // Free the memory for the temporary buffer. |
| 337 | llvm::SmallVector<char, 0> Empty; |
| 338 | SerializedAST = std::move(Empty); |
| 339 | } |
| 340 | }; |
| 341 | |
| 342 | } // anonymous namespace |
| 343 | |
| 344 | std::unique_ptr<ASTConsumer> |
| 345 | ObjectFilePCHContainerWriter::CreatePCHContainerGenerator( |
| 346 | CompilerInstance &CI, const std::string &MainFileName, |
| 347 | const std::string &OutputFileName, |
| 348 | std::unique_ptr<llvm::raw_pwrite_stream> OS, |
| 349 | std::shared_ptr<PCHBuffer> Buffer) const { |
| 350 | return std::make_unique<PCHContainerGenerator>( |
| 351 | args&: CI, args: MainFileName, args: OutputFileName, args: std::move(OS), args&: Buffer); |
| 352 | } |
| 353 | |