| 1 | //===--- DependencyFile.cpp - Generate dependency file --------------------===// |
| 2 | // |
| 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
| 4 | // See https://llvm.org/LICENSE.txt for license information. |
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
| 6 | // |
| 7 | //===----------------------------------------------------------------------===// |
| 8 | // |
| 9 | // This code generates dependency files. |
| 10 | // |
| 11 | //===----------------------------------------------------------------------===// |
| 12 | |
| 13 | #include "clang/Basic/FileManager.h" |
| 14 | #include "clang/Basic/SourceManager.h" |
| 15 | #include "clang/Frontend/DependencyOutputOptions.h" |
| 16 | #include "clang/Frontend/FrontendDiagnostic.h" |
| 17 | #include "clang/Frontend/Utils.h" |
| 18 | #include "clang/Lex/DirectoryLookup.h" |
| 19 | #include "clang/Lex/ModuleMap.h" |
| 20 | #include "clang/Lex/PPCallbacks.h" |
| 21 | #include "clang/Lex/Preprocessor.h" |
| 22 | #include "clang/Serialization/ASTReader.h" |
| 23 | #include "llvm/ADT/StringSet.h" |
| 24 | #include "llvm/Support/FileSystem.h" |
| 25 | #include "llvm/Support/Path.h" |
| 26 | #include "llvm/Support/raw_ostream.h" |
| 27 | #include <optional> |
| 28 | |
| 29 | using namespace clang; |
| 30 | |
| 31 | namespace { |
| 32 | struct DepCollectorPPCallbacks : public PPCallbacks { |
| 33 | DependencyCollector &DepCollector; |
| 34 | Preprocessor &PP; |
| 35 | DepCollectorPPCallbacks(DependencyCollector &L, Preprocessor &PP) |
| 36 | : DepCollector(L), PP(PP) {} |
| 37 | |
| 38 | void LexedFileChanged(FileID FID, LexedFileChangeReason Reason, |
| 39 | SrcMgr::CharacteristicKind FileType, FileID PrevFID, |
| 40 | SourceLocation Loc) override { |
| 41 | if (Reason != PPCallbacks::LexedFileChangeReason::EnterFile) |
| 42 | return; |
| 43 | |
| 44 | // Dependency generation really does want to go all the way to the |
| 45 | // file entry for a source location to find out what is depended on. |
| 46 | // We do not want #line markers to affect dependency generation! |
| 47 | if (std::optional<StringRef> Filename = |
| 48 | PP.getSourceManager().getNonBuiltinFilenameForID(FID)) |
| 49 | DepCollector.maybeAddDependency( |
| 50 | Filename: llvm::sys::path::remove_leading_dotslash(path: *Filename), |
| 51 | /*FromModule*/ false, IsSystem: isSystem(CK: FileType), /*IsModuleFile*/ false, |
| 52 | /*IsMissing*/ false); |
| 53 | } |
| 54 | |
| 55 | void FileSkipped(const FileEntryRef &SkippedFile, const Token &FilenameTok, |
| 56 | SrcMgr::CharacteristicKind FileType) override { |
| 57 | StringRef Filename = |
| 58 | llvm::sys::path::remove_leading_dotslash(path: SkippedFile.getName()); |
| 59 | DepCollector.maybeAddDependency(Filename, /*FromModule=*/false, |
| 60 | /*IsSystem=*/isSystem(CK: FileType), |
| 61 | /*IsModuleFile=*/false, |
| 62 | /*IsMissing=*/false); |
| 63 | } |
| 64 | |
| 65 | void EmbedDirective(SourceLocation, StringRef, bool, |
| 66 | OptionalFileEntryRef File, |
| 67 | const LexEmbedParametersResult &) override { |
| 68 | assert(File && "expected to only be called when the file is found" ); |
| 69 | StringRef FileName = |
| 70 | llvm::sys::path::remove_leading_dotslash(path: File->getName()); |
| 71 | DepCollector.maybeAddDependency(Filename: FileName, |
| 72 | /*FromModule*/ false, |
| 73 | /*IsSystem*/ false, |
| 74 | /*IsModuleFile*/ false, |
| 75 | /*IsMissing*/ false); |
| 76 | } |
| 77 | |
| 78 | void InclusionDirective(SourceLocation HashLoc, const Token &IncludeTok, |
| 79 | StringRef FileName, bool IsAngled, |
| 80 | CharSourceRange FilenameRange, |
| 81 | OptionalFileEntryRef File, StringRef SearchPath, |
| 82 | StringRef RelativePath, const Module *SuggestedModule, |
| 83 | bool ModuleImported, |
| 84 | SrcMgr::CharacteristicKind FileType) override { |
| 85 | if (!File) |
| 86 | DepCollector.maybeAddDependency(Filename: FileName, /*FromModule*/ false, |
| 87 | /*IsSystem*/ false, |
| 88 | /*IsModuleFile*/ false, |
| 89 | /*IsMissing*/ true); |
| 90 | // Files that actually exist are handled by FileChanged. |
| 91 | } |
| 92 | |
| 93 | void HasEmbed(SourceLocation, StringRef, bool, |
| 94 | OptionalFileEntryRef File) override { |
| 95 | if (!File) |
| 96 | return; |
| 97 | StringRef Filename = |
| 98 | llvm::sys::path::remove_leading_dotslash(path: File->getName()); |
| 99 | DepCollector.maybeAddDependency(Filename, |
| 100 | /*FromModule=*/false, IsSystem: false, |
| 101 | /*IsModuleFile=*/false, |
| 102 | /*IsMissing=*/false); |
| 103 | } |
| 104 | |
| 105 | void HasInclude(SourceLocation Loc, StringRef SpelledFilename, bool IsAngled, |
| 106 | OptionalFileEntryRef File, |
| 107 | SrcMgr::CharacteristicKind FileType) override { |
| 108 | if (!File) |
| 109 | return; |
| 110 | StringRef Filename = |
| 111 | llvm::sys::path::remove_leading_dotslash(path: File->getName()); |
| 112 | DepCollector.maybeAddDependency(Filename, /*FromModule=*/false, |
| 113 | /*IsSystem=*/isSystem(CK: FileType), |
| 114 | /*IsModuleFile=*/false, |
| 115 | /*IsMissing=*/false); |
| 116 | } |
| 117 | |
| 118 | void EndOfMainFile() override { |
| 119 | DepCollector.finishedMainFile(Diags&: PP.getDiagnostics()); |
| 120 | } |
| 121 | }; |
| 122 | |
| 123 | struct DepCollectorMMCallbacks : public ModuleMapCallbacks { |
| 124 | DependencyCollector &DepCollector; |
| 125 | DepCollectorMMCallbacks(DependencyCollector &DC) : DepCollector(DC) {} |
| 126 | |
| 127 | void moduleMapFileRead(SourceLocation Loc, FileEntryRef Entry, |
| 128 | bool IsSystem) override { |
| 129 | StringRef Filename = Entry.getName(); |
| 130 | DepCollector.maybeAddDependency(Filename, /*FromModule*/ false, |
| 131 | /*IsSystem*/ IsSystem, |
| 132 | /*IsModuleFile*/ false, |
| 133 | /*IsMissing*/ false); |
| 134 | } |
| 135 | }; |
| 136 | |
| 137 | struct DepCollectorASTListener : public ASTReaderListener { |
| 138 | DependencyCollector &DepCollector; |
| 139 | FileManager &FileMgr; |
| 140 | DepCollectorASTListener(DependencyCollector &L, FileManager &FileMgr) |
| 141 | : DepCollector(L), FileMgr(FileMgr) {} |
| 142 | bool needsInputFileVisitation() override { return true; } |
| 143 | bool needsSystemInputFileVisitation() override { |
| 144 | return DepCollector.needSystemDependencies(); |
| 145 | } |
| 146 | void visitModuleFile(StringRef Filename, |
| 147 | serialization::ModuleKind Kind) override { |
| 148 | DepCollector.maybeAddDependency(Filename, /*FromModule*/ true, |
| 149 | /*IsSystem*/ false, /*IsModuleFile*/ true, |
| 150 | /*IsMissing*/ false); |
| 151 | } |
| 152 | bool visitInputFile(StringRef Filename, bool IsSystem, |
| 153 | bool IsOverridden, bool IsExplicitModule) override { |
| 154 | if (IsOverridden || IsExplicitModule) |
| 155 | return true; |
| 156 | |
| 157 | // Run this through the FileManager in order to respect 'use-external-name' |
| 158 | // in case we have a VFS overlay. |
| 159 | if (auto FE = FileMgr.getOptionalFileRef(Filename)) |
| 160 | Filename = FE->getName(); |
| 161 | |
| 162 | DepCollector.maybeAddDependency(Filename, /*FromModule*/ true, IsSystem, |
| 163 | /*IsModuleFile*/ false, |
| 164 | /*IsMissing*/ false); |
| 165 | return true; |
| 166 | } |
| 167 | }; |
| 168 | } // end anonymous namespace |
| 169 | |
| 170 | void DependencyCollector::maybeAddDependency(StringRef Filename, |
| 171 | bool FromModule, bool IsSystem, |
| 172 | bool IsModuleFile, |
| 173 | bool IsMissing) { |
| 174 | if (sawDependency(Filename, FromModule, IsSystem, IsModuleFile, IsMissing)) |
| 175 | addDependency(Filename); |
| 176 | } |
| 177 | |
| 178 | bool DependencyCollector::addDependency(StringRef Filename) { |
| 179 | StringRef SearchPath; |
| 180 | #ifdef _WIN32 |
| 181 | // Make the search insensitive to case and separators. |
| 182 | llvm::SmallString<256> TmpPath = Filename; |
| 183 | llvm::sys::path::native(TmpPath); |
| 184 | std::transform(TmpPath.begin(), TmpPath.end(), TmpPath.begin(), ::tolower); |
| 185 | SearchPath = TmpPath.str(); |
| 186 | #else |
| 187 | SearchPath = Filename; |
| 188 | #endif |
| 189 | |
| 190 | if (Seen.insert(key: SearchPath).second) { |
| 191 | Dependencies.push_back(x: std::string(Filename)); |
| 192 | return true; |
| 193 | } |
| 194 | return false; |
| 195 | } |
| 196 | |
| 197 | static bool isSpecialFilename(StringRef Filename) { |
| 198 | return Filename == "<built-in>" ; |
| 199 | } |
| 200 | |
| 201 | bool DependencyCollector::sawDependency(StringRef Filename, bool FromModule, |
| 202 | bool IsSystem, bool IsModuleFile, |
| 203 | bool IsMissing) { |
| 204 | return !isSpecialFilename(Filename) && |
| 205 | (needSystemDependencies() || !IsSystem); |
| 206 | } |
| 207 | |
| 208 | DependencyCollector::~DependencyCollector() { } |
| 209 | void DependencyCollector::attachToPreprocessor(Preprocessor &PP) { |
| 210 | PP.addPPCallbacks(C: std::make_unique<DepCollectorPPCallbacks>(args&: *this, args&: PP)); |
| 211 | PP.getHeaderSearchInfo().getModuleMap().addModuleMapCallbacks( |
| 212 | Callback: std::make_unique<DepCollectorMMCallbacks>(args&: *this)); |
| 213 | } |
| 214 | void DependencyCollector::attachToASTReader(ASTReader &R) { |
| 215 | R.addListener( |
| 216 | L: std::make_unique<DepCollectorASTListener>(args&: *this, args&: R.getFileManager())); |
| 217 | } |
| 218 | |
| 219 | DependencyFileGenerator::DependencyFileGenerator( |
| 220 | const DependencyOutputOptions &Opts) |
| 221 | : OutputFile(Opts.OutputFile), Targets(Opts.Targets), |
| 222 | IncludeSystemHeaders(Opts.IncludeSystemHeaders), |
| 223 | PhonyTarget(Opts.UsePhonyTargets), |
| 224 | AddMissingHeaderDeps(Opts.AddMissingHeaderDeps), SeenMissingHeader(false), |
| 225 | IncludeModuleFiles(Opts.IncludeModuleFiles), |
| 226 | OutputFormat(Opts.OutputFormat), InputFileIndex(0) { |
| 227 | for (const auto & : Opts.ExtraDeps) { |
| 228 | if (addDependency(Filename: ExtraDep.first)) |
| 229 | ++InputFileIndex; |
| 230 | } |
| 231 | } |
| 232 | |
| 233 | void DependencyFileGenerator::attachToPreprocessor(Preprocessor &PP) { |
| 234 | // Disable the "file not found" diagnostic if the -MG option was given. |
| 235 | if (AddMissingHeaderDeps) |
| 236 | PP.SetSuppressIncludeNotFoundError(true); |
| 237 | |
| 238 | DependencyCollector::attachToPreprocessor(PP); |
| 239 | } |
| 240 | |
| 241 | bool DependencyFileGenerator::sawDependency(StringRef Filename, bool FromModule, |
| 242 | bool IsSystem, bool IsModuleFile, |
| 243 | bool IsMissing) { |
| 244 | if (IsMissing) { |
| 245 | // Handle the case of missing file from an inclusion directive. |
| 246 | if (AddMissingHeaderDeps) |
| 247 | return true; |
| 248 | SeenMissingHeader = true; |
| 249 | return false; |
| 250 | } |
| 251 | if (IsModuleFile && !IncludeModuleFiles) |
| 252 | return false; |
| 253 | |
| 254 | if (isSpecialFilename(Filename)) |
| 255 | return false; |
| 256 | |
| 257 | if (IncludeSystemHeaders) |
| 258 | return true; |
| 259 | |
| 260 | return !IsSystem; |
| 261 | } |
| 262 | |
| 263 | void DependencyFileGenerator::finishedMainFile(DiagnosticsEngine &Diags) { |
| 264 | outputDependencyFile(Diags); |
| 265 | } |
| 266 | |
| 267 | /// Print the filename, with escaping or quoting that accommodates the three |
| 268 | /// most likely tools that use dependency files: GNU Make, BSD Make, and |
| 269 | /// NMake/Jom. |
| 270 | /// |
| 271 | /// BSD Make is the simplest case: It does no escaping at all. This means |
| 272 | /// characters that are normally delimiters, i.e. space and # (the comment |
| 273 | /// character) simply aren't supported in filenames. |
| 274 | /// |
| 275 | /// GNU Make does allow space and # in filenames, but to avoid being treated |
| 276 | /// as a delimiter or comment, these must be escaped with a backslash. Because |
| 277 | /// backslash is itself the escape character, if a backslash appears in a |
| 278 | /// filename, it should be escaped as well. (As a special case, $ is escaped |
| 279 | /// as $$, which is the normal Make way to handle the $ character.) |
| 280 | /// For compatibility with BSD Make and historical practice, if GNU Make |
| 281 | /// un-escapes characters in a filename but doesn't find a match, it will |
| 282 | /// retry with the unmodified original string. |
| 283 | /// |
| 284 | /// GCC tries to accommodate both Make formats by escaping any space or # |
| 285 | /// characters in the original filename, but not escaping backslashes. The |
| 286 | /// apparent intent is so that filenames with backslashes will be handled |
| 287 | /// correctly by BSD Make, and by GNU Make in its fallback mode of using the |
| 288 | /// unmodified original string; filenames with # or space characters aren't |
| 289 | /// supported by BSD Make at all, but will be handled correctly by GNU Make |
| 290 | /// due to the escaping. |
| 291 | /// |
| 292 | /// A corner case that GCC gets only partly right is when the original filename |
| 293 | /// has a backslash immediately followed by space or #. GNU Make would expect |
| 294 | /// this backslash to be escaped; however GCC escapes the original backslash |
| 295 | /// only when followed by space, not #. It will therefore take a dependency |
| 296 | /// from a directive such as |
| 297 | /// #include "a\ b\#c.h" |
| 298 | /// and emit it as |
| 299 | /// a\\\ b\\#c.h |
| 300 | /// which GNU Make will interpret as |
| 301 | /// a\ b\ |
| 302 | /// followed by a comment. Failing to find this file, it will fall back to the |
| 303 | /// original string, which probably doesn't exist either; in any case it won't |
| 304 | /// find |
| 305 | /// a\ b\#c.h |
| 306 | /// which is the actual filename specified by the include directive. |
| 307 | /// |
| 308 | /// Clang does what GCC does, rather than what GNU Make expects. |
| 309 | /// |
| 310 | /// NMake/Jom has a different set of scary characters, but wraps filespecs in |
| 311 | /// double-quotes to avoid misinterpreting them; see |
| 312 | /// https://msdn.microsoft.com/en-us/library/dd9y37ha.aspx for NMake info, |
| 313 | /// https://msdn.microsoft.com/en-us/library/windows/desktop/aa365247(v=vs.85).aspx |
| 314 | /// for Windows file-naming info. |
| 315 | static void PrintFilename(raw_ostream &OS, StringRef Filename, |
| 316 | DependencyOutputFormat OutputFormat) { |
| 317 | // Convert filename to platform native path |
| 318 | llvm::SmallString<256> NativePath; |
| 319 | llvm::sys::path::native(path: Filename.str(), result&: NativePath); |
| 320 | |
| 321 | if (OutputFormat == DependencyOutputFormat::NMake) { |
| 322 | // Add quotes if needed. These are the characters listed as "special" to |
| 323 | // NMake, that are legal in a Windows filespec, and that could cause |
| 324 | // misinterpretation of the dependency string. |
| 325 | if (NativePath.find_first_of(Chars: " #${}^!" ) != StringRef::npos) |
| 326 | OS << '\"' << NativePath << '\"'; |
| 327 | else |
| 328 | OS << NativePath; |
| 329 | return; |
| 330 | } |
| 331 | assert(OutputFormat == DependencyOutputFormat::Make); |
| 332 | for (unsigned i = 0, e = NativePath.size(); i != e; ++i) { |
| 333 | if (NativePath[i] == '#') // Handle '#' the broken gcc way. |
| 334 | OS << '\\'; |
| 335 | else if (NativePath[i] == ' ') { // Handle space correctly. |
| 336 | OS << '\\'; |
| 337 | unsigned j = i; |
| 338 | while (j > 0 && NativePath[--j] == '\\') |
| 339 | OS << '\\'; |
| 340 | } else if (NativePath[i] == '$') // $ is escaped by $$. |
| 341 | OS << '$'; |
| 342 | OS << NativePath[i]; |
| 343 | } |
| 344 | } |
| 345 | |
| 346 | void DependencyFileGenerator::outputDependencyFile(DiagnosticsEngine &Diags) { |
| 347 | if (SeenMissingHeader) { |
| 348 | llvm::sys::fs::remove(path: OutputFile); |
| 349 | return; |
| 350 | } |
| 351 | |
| 352 | std::error_code EC; |
| 353 | llvm::raw_fd_ostream OS(OutputFile, EC, llvm::sys::fs::OF_TextWithCRLF); |
| 354 | if (EC) { |
| 355 | Diags.Report(DiagID: diag::err_fe_error_opening) << OutputFile << EC.message(); |
| 356 | return; |
| 357 | } |
| 358 | |
| 359 | outputDependencyFile(OS); |
| 360 | } |
| 361 | |
| 362 | void DependencyFileGenerator::outputDependencyFile(llvm::raw_ostream &OS) { |
| 363 | // Write out the dependency targets, trying to avoid overly long |
| 364 | // lines when possible. We try our best to emit exactly the same |
| 365 | // dependency file as GCC>=10, assuming the included files are the |
| 366 | // same. |
| 367 | const unsigned MaxColumns = 75; |
| 368 | unsigned Columns = 0; |
| 369 | |
| 370 | for (StringRef Target : Targets) { |
| 371 | unsigned N = Target.size(); |
| 372 | if (Columns == 0) { |
| 373 | Columns += N; |
| 374 | } else if (Columns + N + 2 > MaxColumns) { |
| 375 | Columns = N + 2; |
| 376 | OS << " \\\n " ; |
| 377 | } else { |
| 378 | Columns += N + 1; |
| 379 | OS << ' '; |
| 380 | } |
| 381 | // Targets already quoted as needed. |
| 382 | OS << Target; |
| 383 | } |
| 384 | |
| 385 | OS << ':'; |
| 386 | Columns += 1; |
| 387 | |
| 388 | // Now add each dependency in the order it was seen, but avoiding |
| 389 | // duplicates. |
| 390 | ArrayRef<std::string> Files = getDependencies(); |
| 391 | for (StringRef File : Files) { |
| 392 | if (File == "<stdin>" ) |
| 393 | continue; |
| 394 | // Start a new line if this would exceed the column limit. Make |
| 395 | // sure to leave space for a trailing " \" in case we need to |
| 396 | // break the line on the next iteration. |
| 397 | unsigned N = File.size(); |
| 398 | if (Columns + (N + 1) + 2 > MaxColumns) { |
| 399 | OS << " \\\n " ; |
| 400 | Columns = 2; |
| 401 | } |
| 402 | OS << ' '; |
| 403 | PrintFilename(OS, Filename: File, OutputFormat); |
| 404 | Columns += N + 1; |
| 405 | } |
| 406 | OS << '\n'; |
| 407 | |
| 408 | // Create phony targets if requested. |
| 409 | if (PhonyTarget && !Files.empty()) { |
| 410 | unsigned Index = 0; |
| 411 | for (auto I = Files.begin(), E = Files.end(); I != E; ++I) { |
| 412 | if (Index++ == InputFileIndex) |
| 413 | continue; |
| 414 | PrintFilename(OS, Filename: *I, OutputFormat); |
| 415 | OS << ":\n" ; |
| 416 | } |
| 417 | } |
| 418 | } |
| 419 | |