| 1 | //===- DbiModuleList.cpp - PDB module information list --------------------===// | 
|---|
| 2 | // | 
|---|
| 3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. | 
|---|
| 4 | // See https://llvm.org/LICENSE.txt for license information. | 
|---|
| 5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception | 
|---|
| 6 | // | 
|---|
| 7 | //===----------------------------------------------------------------------===// | 
|---|
| 8 |  | 
|---|
| 9 | #include "llvm/DebugInfo/PDB/Native/DbiModuleList.h" | 
|---|
| 10 | #include "llvm/ADT/StringRef.h" | 
|---|
| 11 | #include "llvm/ADT/iterator_range.h" | 
|---|
| 12 | #include "llvm/DebugInfo/PDB/Native/RawError.h" | 
|---|
| 13 | #include "llvm/DebugInfo/PDB/Native/RawTypes.h" | 
|---|
| 14 | #include "llvm/Support/BinaryStreamReader.h" | 
|---|
| 15 | #include "llvm/Support/Error.h" | 
|---|
| 16 | #include <cassert> | 
|---|
| 17 | #include <cstddef> | 
|---|
| 18 | #include <cstdint> | 
|---|
| 19 |  | 
|---|
| 20 | using namespace llvm; | 
|---|
| 21 | using namespace llvm::pdb; | 
|---|
| 22 |  | 
|---|
| 23 | DbiModuleSourceFilesIterator::DbiModuleSourceFilesIterator( | 
|---|
| 24 | const DbiModuleList &Modules, uint32_t Modi, uint16_t Filei) | 
|---|
| 25 | : Modules(&Modules), Modi(Modi), Filei(Filei) { | 
|---|
| 26 | setValue(); | 
|---|
| 27 | } | 
|---|
| 28 |  | 
|---|
| 29 | bool DbiModuleSourceFilesIterator:: | 
|---|
| 30 | operator==(const DbiModuleSourceFilesIterator &R) const { | 
|---|
| 31 | // incompatible iterators are never equal | 
|---|
| 32 | if (!isCompatible(R)) | 
|---|
| 33 | return false; | 
|---|
| 34 |  | 
|---|
| 35 | // If they're compatible, and they're both ends, then they're equal. | 
|---|
| 36 | if (isEnd() && R.isEnd()) | 
|---|
| 37 | return true; | 
|---|
| 38 |  | 
|---|
| 39 | // If one is an end and the other is not, they're not equal. | 
|---|
| 40 | if (isEnd() != R.isEnd()) | 
|---|
| 41 | return false; | 
|---|
| 42 |  | 
|---|
| 43 | // Now we know: | 
|---|
| 44 | // - They're compatible | 
|---|
| 45 | // - They're not *both* end iterators | 
|---|
| 46 | // - Their endness is the same. | 
|---|
| 47 | // Thus, they're compatible iterators pointing to a valid file on the same | 
|---|
| 48 | // module.  All we need to check are the file indices. | 
|---|
| 49 | assert(Modules == R.Modules); | 
|---|
| 50 | assert(Modi == R.Modi); | 
|---|
| 51 | assert(!isEnd()); | 
|---|
| 52 | assert(!R.isEnd()); | 
|---|
| 53 |  | 
|---|
| 54 | return (Filei == R.Filei); | 
|---|
| 55 | } | 
|---|
| 56 |  | 
|---|
| 57 | bool DbiModuleSourceFilesIterator:: | 
|---|
| 58 | operator<(const DbiModuleSourceFilesIterator &R) const { | 
|---|
| 59 | assert(isCompatible(R)); | 
|---|
| 60 |  | 
|---|
| 61 | // It's not sufficient to compare the file indices, because default | 
|---|
| 62 | // constructed iterators could be equal to iterators with valid indices.  To | 
|---|
| 63 | // account for this, early-out if they're equal. | 
|---|
| 64 | if (*this == R) | 
|---|
| 65 | return false; | 
|---|
| 66 |  | 
|---|
| 67 | return Filei < R.Filei; | 
|---|
| 68 | } | 
|---|
| 69 |  | 
|---|
| 70 | std::ptrdiff_t DbiModuleSourceFilesIterator:: | 
|---|
| 71 | operator-(const DbiModuleSourceFilesIterator &R) const { | 
|---|
| 72 | assert(isCompatible(R)); | 
|---|
| 73 | assert(!(*this < R)); | 
|---|
| 74 |  | 
|---|
| 75 | // If they're both end iterators, the distance is 0. | 
|---|
| 76 | if (isEnd() && R.isEnd()) | 
|---|
| 77 | return 0; | 
|---|
| 78 |  | 
|---|
| 79 | assert(!R.isEnd()); | 
|---|
| 80 |  | 
|---|
| 81 | // At this point, R cannot be end, but *this can, which means that *this | 
|---|
| 82 | // might be a universal end iterator with none of its fields set.  So in that | 
|---|
| 83 | // case have to rely on R as the authority to figure out how many files there | 
|---|
| 84 | // are to compute the distance. | 
|---|
| 85 | uint32_t Thisi = Filei; | 
|---|
| 86 | if (isEnd()) { | 
|---|
| 87 | uint32_t RealModi = R.Modi; | 
|---|
| 88 | Thisi = R.Modules->getSourceFileCount(Modi: RealModi); | 
|---|
| 89 | } | 
|---|
| 90 |  | 
|---|
| 91 | assert(Thisi >= R.Filei); | 
|---|
| 92 | return Thisi - R.Filei; | 
|---|
| 93 | } | 
|---|
| 94 |  | 
|---|
| 95 | DbiModuleSourceFilesIterator &DbiModuleSourceFilesIterator:: | 
|---|
| 96 | operator+=(std::ptrdiff_t N) { | 
|---|
| 97 | assert(!isEnd()); | 
|---|
| 98 |  | 
|---|
| 99 | Filei += N; | 
|---|
| 100 | assert(Filei <= Modules->getSourceFileCount(Modi)); | 
|---|
| 101 | setValue(); | 
|---|
| 102 | return *this; | 
|---|
| 103 | } | 
|---|
| 104 |  | 
|---|
| 105 | DbiModuleSourceFilesIterator &DbiModuleSourceFilesIterator:: | 
|---|
| 106 | operator-=(std::ptrdiff_t N) { | 
|---|
| 107 | // Note that we can subtract from an end iterator, but not a universal end | 
|---|
| 108 | // iterator. | 
|---|
| 109 | assert(!isUniversalEnd()); | 
|---|
| 110 |  | 
|---|
| 111 | assert(N <= Filei); | 
|---|
| 112 |  | 
|---|
| 113 | Filei -= N; | 
|---|
| 114 | return *this; | 
|---|
| 115 | } | 
|---|
| 116 |  | 
|---|
| 117 | void DbiModuleSourceFilesIterator::setValue() { | 
|---|
| 118 | if (isEnd()) { | 
|---|
| 119 | ThisValue = ""; | 
|---|
| 120 | return; | 
|---|
| 121 | } | 
|---|
| 122 |  | 
|---|
| 123 | uint32_t Off = Modules->ModuleInitialFileIndex[Modi] + Filei; | 
|---|
| 124 | auto ExpectedValue = Modules->getFileName(Index: Off); | 
|---|
| 125 | if (!ExpectedValue) { | 
|---|
| 126 | consumeError(Err: ExpectedValue.takeError()); | 
|---|
| 127 | Filei = Modules->getSourceFileCount(Modi); | 
|---|
| 128 | } else | 
|---|
| 129 | ThisValue = *ExpectedValue; | 
|---|
| 130 | } | 
|---|
| 131 |  | 
|---|
| 132 | bool DbiModuleSourceFilesIterator::isEnd() const { | 
|---|
| 133 | if (isUniversalEnd()) | 
|---|
| 134 | return true; | 
|---|
| 135 |  | 
|---|
| 136 | assert(Modules); | 
|---|
| 137 | assert(Modi <= Modules->getModuleCount()); | 
|---|
| 138 | assert(Filei <= Modules->getSourceFileCount(Modi)); | 
|---|
| 139 |  | 
|---|
| 140 | if (Modi == Modules->getModuleCount()) | 
|---|
| 141 | return true; | 
|---|
| 142 | if (Filei == Modules->getSourceFileCount(Modi)) | 
|---|
| 143 | return true; | 
|---|
| 144 | return false; | 
|---|
| 145 | } | 
|---|
| 146 |  | 
|---|
| 147 | bool DbiModuleSourceFilesIterator::isUniversalEnd() const { return !Modules; } | 
|---|
| 148 |  | 
|---|
| 149 | bool DbiModuleSourceFilesIterator::isCompatible( | 
|---|
| 150 | const DbiModuleSourceFilesIterator &R) const { | 
|---|
| 151 | // Universal iterators are compatible with any other iterator. | 
|---|
| 152 | if (isUniversalEnd() || R.isUniversalEnd()) | 
|---|
| 153 | return true; | 
|---|
| 154 |  | 
|---|
| 155 | // At this point, neither iterator is a universal end iterator, although one | 
|---|
| 156 | // or both might be non-universal end iterators.  Regardless, the module index | 
|---|
| 157 | // is valid, so they are compatible if and only if they refer to the same | 
|---|
| 158 | // module. | 
|---|
| 159 | return Modi == R.Modi; | 
|---|
| 160 | } | 
|---|
| 161 |  | 
|---|
| 162 | Error DbiModuleList::initialize(BinaryStreamRef ModInfo, | 
|---|
| 163 | BinaryStreamRef FileInfo) { | 
|---|
| 164 | if (auto EC = initializeModInfo(ModInfo)) | 
|---|
| 165 | return EC; | 
|---|
| 166 | if (auto EC = initializeFileInfo(FileInfo)) | 
|---|
| 167 | return EC; | 
|---|
| 168 |  | 
|---|
| 169 | return Error::success(); | 
|---|
| 170 | } | 
|---|
| 171 |  | 
|---|
| 172 | Error DbiModuleList::initializeModInfo(BinaryStreamRef ModInfo) { | 
|---|
| 173 | ModInfoSubstream = ModInfo; | 
|---|
| 174 |  | 
|---|
| 175 | if (ModInfo.getLength() == 0) | 
|---|
| 176 | return Error::success(); | 
|---|
| 177 |  | 
|---|
| 178 | BinaryStreamReader Reader(ModInfo); | 
|---|
| 179 |  | 
|---|
| 180 | if (auto EC = Reader.readArray(Array&: Descriptors, Size: ModInfo.getLength())) | 
|---|
| 181 | return EC; | 
|---|
| 182 |  | 
|---|
| 183 | return Error::success(); | 
|---|
| 184 | } | 
|---|
| 185 |  | 
|---|
| 186 | Error DbiModuleList::initializeFileInfo(BinaryStreamRef FileInfo) { | 
|---|
| 187 | FileInfoSubstream = FileInfo; | 
|---|
| 188 |  | 
|---|
| 189 | if (FileInfo.getLength() == 0) | 
|---|
| 190 | return Error::success(); | 
|---|
| 191 |  | 
|---|
| 192 | BinaryStreamReader FISR(FileInfo); | 
|---|
| 193 | if (auto EC = FISR.readObject(Dest&: FileInfoHeader)) | 
|---|
| 194 | return EC; | 
|---|
| 195 |  | 
|---|
| 196 | // First is an array of `NumModules` module indices.  This does not seem to be | 
|---|
| 197 | // used for anything meaningful, so we ignore it. | 
|---|
| 198 | FixedStreamArray<support::ulittle16_t> ModuleIndices; | 
|---|
| 199 | if (auto EC = FISR.readArray(Array&: ModuleIndices, NumItems: FileInfoHeader->NumModules)) | 
|---|
| 200 | return EC; | 
|---|
| 201 | if (auto EC = FISR.readArray(Array&: ModFileCountArray, NumItems: FileInfoHeader->NumModules)) | 
|---|
| 202 | return EC; | 
|---|
| 203 |  | 
|---|
| 204 | // Compute the real number of source files.  We can't trust the value in | 
|---|
| 205 | // `FileInfoHeader->NumSourceFiles` because it is a unit16, and the sum of all | 
|---|
| 206 | // source file counts might be larger than a unit16.  So we compute the real | 
|---|
| 207 | // count by summing up the individual counts. | 
|---|
| 208 | uint32_t NumSourceFiles = 0; | 
|---|
| 209 | for (auto Count : ModFileCountArray) | 
|---|
| 210 | NumSourceFiles += Count; | 
|---|
| 211 |  | 
|---|
| 212 | // In the reference implementation, this array is where the pointer documented | 
|---|
| 213 | // at the definition of ModuleInfoHeader::FileNameOffs points to.  Note that | 
|---|
| 214 | // although the field in ModuleInfoHeader is ignored this array is not, as it | 
|---|
| 215 | // is the authority on where each filename begins in the names buffer. | 
|---|
| 216 | if (auto EC = FISR.readArray(Array&: FileNameOffsets, NumItems: NumSourceFiles)) | 
|---|
| 217 | return EC; | 
|---|
| 218 |  | 
|---|
| 219 | if (auto EC = FISR.readStreamRef(Ref&: NamesBuffer)) | 
|---|
| 220 | return EC; | 
|---|
| 221 |  | 
|---|
| 222 | auto DescriptorIter = Descriptors.begin(); | 
|---|
| 223 | uint32_t NextFileIndex = 0; | 
|---|
| 224 | ModuleInitialFileIndex.resize(new_size: FileInfoHeader->NumModules); | 
|---|
| 225 | ModuleDescriptorOffsets.resize(new_size: FileInfoHeader->NumModules); | 
|---|
| 226 | for (size_t I = 0; I < FileInfoHeader->NumModules; ++I) { | 
|---|
| 227 | assert(DescriptorIter != Descriptors.end()); | 
|---|
| 228 | ModuleInitialFileIndex[I] = NextFileIndex; | 
|---|
| 229 | ModuleDescriptorOffsets[I] = DescriptorIter.offset(); | 
|---|
| 230 |  | 
|---|
| 231 | NextFileIndex += ModFileCountArray[I]; | 
|---|
| 232 | ++DescriptorIter; | 
|---|
| 233 | } | 
|---|
| 234 |  | 
|---|
| 235 | assert(DescriptorIter == Descriptors.end()); | 
|---|
| 236 | assert(NextFileIndex == NumSourceFiles); | 
|---|
| 237 |  | 
|---|
| 238 | return Error::success(); | 
|---|
| 239 | } | 
|---|
| 240 |  | 
|---|
| 241 | uint32_t DbiModuleList::getModuleCount() const { | 
|---|
| 242 | // Workaround to avoid the crash until upstream issue is fixed: | 
|---|
| 243 | // https://github.com/llvm/llvm-project/issues/55214 | 
|---|
| 244 | return FileInfoHeader ? FileInfoHeader->NumModules : 0; | 
|---|
| 245 | } | 
|---|
| 246 |  | 
|---|
| 247 | uint32_t DbiModuleList::getSourceFileCount() const { | 
|---|
| 248 | return FileNameOffsets.size(); | 
|---|
| 249 | } | 
|---|
| 250 |  | 
|---|
| 251 | uint16_t DbiModuleList::getSourceFileCount(uint32_t Modi) const { | 
|---|
| 252 | return ModFileCountArray[Modi]; | 
|---|
| 253 | } | 
|---|
| 254 |  | 
|---|
| 255 | DbiModuleDescriptor DbiModuleList::getModuleDescriptor(uint32_t Modi) const { | 
|---|
| 256 | assert(Modi < getModuleCount()); | 
|---|
| 257 | uint32_t Offset = ModuleDescriptorOffsets[Modi]; | 
|---|
| 258 | auto Iter = Descriptors.at(Offset); | 
|---|
| 259 | assert(Iter != Descriptors.end()); | 
|---|
| 260 | return *Iter; | 
|---|
| 261 | } | 
|---|
| 262 |  | 
|---|
| 263 | iterator_range<DbiModuleSourceFilesIterator> | 
|---|
| 264 | DbiModuleList::source_files(uint32_t Modi) const { | 
|---|
| 265 | return make_range<DbiModuleSourceFilesIterator>( | 
|---|
| 266 | x: DbiModuleSourceFilesIterator(*this, Modi, 0), | 
|---|
| 267 | y: DbiModuleSourceFilesIterator()); | 
|---|
| 268 | } | 
|---|
| 269 |  | 
|---|
| 270 | Expected<StringRef> DbiModuleList::getFileName(uint32_t Index) const { | 
|---|
| 271 | BinaryStreamReader Names(NamesBuffer); | 
|---|
| 272 | if (Index >= getSourceFileCount()) | 
|---|
| 273 | return make_error<RawError>(Args: raw_error_code::index_out_of_bounds); | 
|---|
| 274 |  | 
|---|
| 275 | uint32_t FileOffset = FileNameOffsets[Index]; | 
|---|
| 276 | Names.setOffset(FileOffset); | 
|---|
| 277 | StringRef Name; | 
|---|
| 278 | if (auto EC = Names.readCString(Dest&: Name)) | 
|---|
| 279 | return std::move(EC); | 
|---|
| 280 | return Name; | 
|---|
| 281 | } | 
|---|
| 282 |  | 
|---|