//===--- WhitespaceManager.cpp - Format C++ code --------------------------===//
//
// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
// See https://llvm.org/LICENSE.txt for license information.
// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
//
//===----------------------------------------------------------------------===//
///
/// \file
/// This file implements the WhitespaceManager class.
///
//===----------------------------------------------------------------------===//
| 13 | |
| 14 | #include "WhitespaceManager.h" |
| 15 | #include "llvm/ADT/STLExtras.h" |
| 16 | #include "llvm/ADT/SmallVector.h" |
| 17 | #include <algorithm> |
| 18 | #include <optional> |
| 19 | |
| 20 | namespace clang { |
| 21 | namespace format { |
| 22 | |
| 23 | bool WhitespaceManager::Change::IsBeforeInFile::operator()( |
| 24 | const Change &C1, const Change &C2) const { |
| 25 | return SourceMgr.isBeforeInTranslationUnit( |
| 26 | LHS: C1.OriginalWhitespaceRange.getBegin(), |
| 27 | RHS: C2.OriginalWhitespaceRange.getBegin()) || |
| 28 | (C1.OriginalWhitespaceRange.getBegin() == |
| 29 | C2.OriginalWhitespaceRange.getBegin() && |
| 30 | SourceMgr.isBeforeInTranslationUnit( |
| 31 | LHS: C1.OriginalWhitespaceRange.getEnd(), |
| 32 | RHS: C2.OriginalWhitespaceRange.getEnd())); |
| 33 | } |
| 34 | |
| 35 | WhitespaceManager::Change::Change(const FormatToken &Tok, |
| 36 | bool CreateReplacement, |
| 37 | SourceRange OriginalWhitespaceRange, |
| 38 | int Spaces, unsigned StartOfTokenColumn, |
| 39 | unsigned IndentedFromColumn, |
| 40 | unsigned NewlinesBefore, |
| 41 | StringRef PreviousLinePostfix, |
| 42 | StringRef CurrentLinePrefix, bool IsAligned, |
| 43 | bool ContinuesPPDirective, bool IsInsideToken) |
| 44 | : Tok(&Tok), CreateReplacement(CreateReplacement), |
| 45 | OriginalWhitespaceRange(OriginalWhitespaceRange), |
| 46 | StartOfTokenColumn(StartOfTokenColumn), |
| 47 | IndentedFromColumn(IndentedFromColumn), NewlinesBefore(NewlinesBefore), |
| 48 | PreviousLinePostfix(PreviousLinePostfix), |
| 49 | CurrentLinePrefix(CurrentLinePrefix), IsAligned(IsAligned), |
| 50 | ContinuesPPDirective(ContinuesPPDirective), Spaces(Spaces), |
| 51 | IsInsideToken(IsInsideToken), IsTrailingComment(false), TokenLength(0), |
| 52 | PreviousEndOfTokenColumn(0), EscapedNewlineColumn(0), |
| 53 | StartOfBlockComment(nullptr), IndentationOffset(0), ConditionalsLevel(0) { |
| 54 | } |
| 55 | |
| 56 | void WhitespaceManager::replaceWhitespace(FormatToken &Tok, unsigned Newlines, |
| 57 | unsigned Spaces, |
| 58 | unsigned StartOfTokenColumn, |
| 59 | bool IsAligned, bool InPPDirective, |
| 60 | unsigned IndentedFromColumn) { |
| 61 | if (Tok.Finalized || (Tok.MacroCtx && Tok.MacroCtx->Role == MR_ExpandedArg)) |
| 62 | return; |
| 63 | Tok.setDecision((Newlines > 0) ? FD_Break : FD_Continue); |
| 64 | Changes.push_back(Elt: Change(Tok, /*CreateReplacement=*/true, Tok.WhitespaceRange, |
| 65 | Spaces, StartOfTokenColumn, IndentedFromColumn, |
| 66 | Newlines, "" , "" , IsAligned, |
| 67 | InPPDirective && !Tok.IsFirst, |
| 68 | /*IsInsideToken=*/false)); |
| 69 | } |
| 70 | |
| 71 | void WhitespaceManager::addUntouchableToken(const FormatToken &Tok, |
| 72 | bool InPPDirective) { |
| 73 | if (Tok.Finalized || (Tok.MacroCtx && Tok.MacroCtx->Role == MR_ExpandedArg)) |
| 74 | return; |
| 75 | Changes.push_back(Elt: Change( |
| 76 | Tok, /*CreateReplacement=*/false, Tok.WhitespaceRange, /*Spaces=*/0, |
| 77 | Tok.OriginalColumn, /*IndentedFromColumn=*/0, Tok.NewlinesBefore, "" , "" , |
| 78 | /*IsAligned=*/false, InPPDirective && !Tok.IsFirst, |
| 79 | /*IsInsideToken=*/false)); |
| 80 | } |
| 81 | |
| 82 | llvm::Error |
| 83 | WhitespaceManager::addReplacement(const tooling::Replacement &Replacement) { |
| 84 | return Replaces.add(R: Replacement); |
| 85 | } |
| 86 | |
| 87 | bool WhitespaceManager::inputUsesCRLF(StringRef Text, bool DefaultToCRLF) { |
| 88 | size_t LF = Text.count(C: '\n'); |
| 89 | size_t CR = Text.count(C: '\r') * 2; |
| 90 | return LF == CR ? DefaultToCRLF : CR > LF; |
| 91 | } |
| 92 | |
| 93 | void WhitespaceManager::replaceWhitespaceInToken( |
| 94 | const FormatToken &Tok, unsigned Offset, unsigned ReplaceChars, |
| 95 | StringRef PreviousPostfix, StringRef CurrentPrefix, bool InPPDirective, |
| 96 | unsigned Newlines, int Spaces) { |
| 97 | if (Tok.Finalized || (Tok.MacroCtx && Tok.MacroCtx->Role == MR_ExpandedArg)) |
| 98 | return; |
| 99 | SourceLocation Start = Tok.getStartOfNonWhitespace().getLocWithOffset(Offset); |
| 100 | Changes.push_back( |
| 101 | Elt: Change(Tok, /*CreateReplacement=*/true, |
| 102 | SourceRange(Start, Start.getLocWithOffset(Offset: ReplaceChars)), Spaces, |
| 103 | std::max(a: 0, b: Spaces), /*IndentedFromColumn=*/0, Newlines, |
| 104 | PreviousPostfix, CurrentPrefix, |
| 105 | /*IsAligned=*/true, InPPDirective && !Tok.IsFirst, |
| 106 | /*IsInsideToken=*/true)); |
| 107 | } |
| 108 | |
| 109 | const tooling::Replacements &WhitespaceManager::generateReplacements() { |
| 110 | if (Changes.empty()) |
| 111 | return Replaces; |
| 112 | |
| 113 | llvm::sort(C&: Changes, Comp: Change::IsBeforeInFile(SourceMgr)); |
| 114 | calculateLineBreakInformation(); |
| 115 | alignConsecutiveMacros(); |
| 116 | alignConsecutiveShortCaseStatements(/*IsExpr=*/true); |
| 117 | alignConsecutiveShortCaseStatements(/*IsExpr=*/false); |
| 118 | alignConsecutiveDeclarations(); |
| 119 | alignConsecutiveBitFields(); |
| 120 | alignConsecutiveAssignments(); |
| 121 | if (Style.isTableGen()) { |
| 122 | alignConsecutiveTableGenBreakingDAGArgColons(); |
| 123 | alignConsecutiveTableGenCondOperatorColons(); |
| 124 | alignConsecutiveTableGenDefinitions(); |
| 125 | } |
| 126 | alignChainedConditionals(); |
| 127 | alignTrailingComments(); |
| 128 | alignEscapedNewlines(); |
| 129 | alignArrayInitializers(); |
| 130 | generateChanges(); |
| 131 | |
| 132 | return Replaces; |
| 133 | } |
| 134 | |
| 135 | void WhitespaceManager::calculateLineBreakInformation() { |
| 136 | Changes[0].PreviousEndOfTokenColumn = 0; |
| 137 | Change *LastOutsideTokenChange = &Changes[0]; |
| 138 | for (unsigned I = 1, e = Changes.size(); I != e; ++I) { |
| 139 | auto &C = Changes[I]; |
| 140 | auto &P = Changes[I - 1]; |
| 141 | auto &PrevTokLength = P.TokenLength; |
| 142 | SourceLocation OriginalWhitespaceStart = |
| 143 | C.OriginalWhitespaceRange.getBegin(); |
| 144 | SourceLocation PreviousOriginalWhitespaceEnd = |
| 145 | P.OriginalWhitespaceRange.getEnd(); |
| 146 | unsigned OriginalWhitespaceStartOffset = |
| 147 | SourceMgr.getFileOffset(SpellingLoc: OriginalWhitespaceStart); |
| 148 | unsigned PreviousOriginalWhitespaceEndOffset = |
| 149 | SourceMgr.getFileOffset(SpellingLoc: PreviousOriginalWhitespaceEnd); |
| 150 | assert(PreviousOriginalWhitespaceEndOffset <= |
| 151 | OriginalWhitespaceStartOffset); |
| 152 | const char *const PreviousOriginalWhitespaceEndData = |
| 153 | SourceMgr.getCharacterData(SL: PreviousOriginalWhitespaceEnd); |
| 154 | StringRef Text(PreviousOriginalWhitespaceEndData, |
| 155 | SourceMgr.getCharacterData(SL: OriginalWhitespaceStart) - |
| 156 | PreviousOriginalWhitespaceEndData); |
| 157 | // Usually consecutive changes would occur in consecutive tokens. This is |
| 158 | // not the case however when analyzing some preprocessor runs of the |
| 159 | // annotated lines. For example, in this code: |
| 160 | // |
| 161 | // #if A // line 1 |
| 162 | // int i = 1; |
| 163 | // #else B // line 2 |
| 164 | // int i = 2; |
| 165 | // #endif // line 3 |
| 166 | // |
| 167 | // one of the runs will produce the sequence of lines marked with line 1, 2 |
| 168 | // and 3. So the two consecutive whitespace changes just before '// line 2' |
| 169 | // and before '#endif // line 3' span multiple lines and tokens: |
| 170 | // |
| 171 | // #else B{change X}[// line 2 |
| 172 | // int i = 2; |
| 173 | // ]{change Y}#endif // line 3 |
| 174 | // |
| 175 | // For this reason, if the text between consecutive changes spans multiple |
| 176 | // newlines, the token length must be adjusted to the end of the original |
| 177 | // line of the token. |
| 178 | auto NewlinePos = Text.find_first_of(C: '\n'); |
| 179 | if (NewlinePos == StringRef::npos) { |
| 180 | PrevTokLength = OriginalWhitespaceStartOffset - |
| 181 | PreviousOriginalWhitespaceEndOffset + |
| 182 | C.PreviousLinePostfix.size() + P.CurrentLinePrefix.size(); |
| 183 | if (!P.IsInsideToken) |
| 184 | PrevTokLength = std::min(a: PrevTokLength, b: P.Tok->ColumnWidth); |
| 185 | } else { |
| 186 | PrevTokLength = NewlinePos + P.CurrentLinePrefix.size(); |
| 187 | } |
| 188 | |
| 189 | // If there are multiple changes in this token, sum up all the changes until |
| 190 | // the end of the line. |
| 191 | if (P.IsInsideToken && P.NewlinesBefore == 0) |
| 192 | LastOutsideTokenChange->TokenLength += PrevTokLength + P.Spaces; |
| 193 | else |
| 194 | LastOutsideTokenChange = &P; |
| 195 | |
| 196 | C.PreviousEndOfTokenColumn = P.StartOfTokenColumn + PrevTokLength; |
| 197 | |
| 198 | P.IsTrailingComment = |
| 199 | (C.NewlinesBefore > 0 || C.Tok->is(Kind: tok::eof) || |
| 200 | (C.IsInsideToken && C.Tok->is(Kind: tok::comment))) && |
| 201 | P.Tok->is(Kind: tok::comment) && |
| 202 | // FIXME: This is a dirty hack. The problem is that |
| 203 | // BreakableLineCommentSection does comment reflow changes and here is |
| 204 | // the aligning of trailing comments. Consider the case where we reflow |
| 205 | // the second line up in this example: |
| 206 | // |
| 207 | // // line 1 |
| 208 | // // line 2 |
| 209 | // |
| 210 | // That amounts to 2 changes by BreakableLineCommentSection: |
| 211 | // - the first, delimited by (), for the whitespace between the tokens, |
| 212 | // - and second, delimited by [], for the whitespace at the beginning |
| 213 | // of the second token: |
| 214 | // |
| 215 | // // line 1( |
| 216 | // )[// ]line 2 |
| 217 | // |
| 218 | // So in the end we have two changes like this: |
| 219 | // |
| 220 | // // line1()[ ]line 2 |
| 221 | // |
| 222 | // Note that the OriginalWhitespaceStart of the second change is the |
| 223 | // same as the PreviousOriginalWhitespaceEnd of the first change. |
| 224 | // In this case, the below check ensures that the second change doesn't |
| 225 | // get treated as a trailing comment change here, since this might |
| 226 | // trigger additional whitespace to be wrongly inserted before "line 2" |
| 227 | // by the comment aligner here. |
| 228 | // |
| 229 | // For a proper solution we need a mechanism to say to WhitespaceManager |
| 230 | // that a particular change breaks the current sequence of trailing |
| 231 | // comments. |
| 232 | OriginalWhitespaceStart != PreviousOriginalWhitespaceEnd; |
| 233 | } |
| 234 | // FIXME: The last token is currently not always an eof token; in those |
| 235 | // cases, setting TokenLength of the last token to 0 is wrong. |
| 236 | Changes.back().TokenLength = 0; |
| 237 | Changes.back().IsTrailingComment = Changes.back().Tok->is(Kind: tok::comment); |
| 238 | |
| 239 | const WhitespaceManager::Change * = nullptr; |
| 240 | for (auto &Change : Changes) { |
| 241 | // Reset the IsTrailingComment flag for changes inside of trailing comments |
| 242 | // so they don't get realigned later. Comment line breaks however still need |
| 243 | // to be aligned. |
| 244 | if (Change.IsInsideToken && Change.NewlinesBefore == 0) |
| 245 | Change.IsTrailingComment = false; |
| 246 | Change.StartOfBlockComment = nullptr; |
| 247 | Change.IndentationOffset = 0; |
| 248 | if (Change.Tok->is(Kind: tok::comment)) { |
| 249 | if (Change.Tok->is(TT: TT_LineComment) || !Change.IsInsideToken) { |
| 250 | LastBlockComment = &Change; |
| 251 | } else if ((Change.StartOfBlockComment = LastBlockComment)) { |
| 252 | Change.IndentationOffset = |
| 253 | Change.StartOfTokenColumn - |
| 254 | Change.StartOfBlockComment->StartOfTokenColumn; |
| 255 | } |
| 256 | } else { |
| 257 | LastBlockComment = nullptr; |
| 258 | } |
| 259 | } |
| 260 | |
| 261 | // Compute conditional nesting level |
| 262 | // Level is increased for each conditional, unless this conditional continues |
| 263 | // a chain of conditional, i.e. starts immediately after the colon of another |
| 264 | // conditional. |
| 265 | SmallVector<bool, 16> ScopeStack; |
| 266 | int ConditionalsLevel = 0; |
| 267 | for (auto &Change : Changes) { |
| 268 | for (unsigned i = 0, e = Change.Tok->FakeLParens.size(); i != e; ++i) { |
| 269 | bool isNestedConditional = |
| 270 | Change.Tok->FakeLParens[e - 1 - i] == prec::Conditional && |
| 271 | !(i == 0 && Change.Tok->Previous && |
| 272 | Change.Tok->Previous->is(TT: TT_ConditionalExpr) && |
| 273 | Change.Tok->Previous->is(Kind: tok::colon)); |
| 274 | if (isNestedConditional) |
| 275 | ++ConditionalsLevel; |
| 276 | ScopeStack.push_back(Elt: isNestedConditional); |
| 277 | } |
| 278 | |
| 279 | Change.ConditionalsLevel = ConditionalsLevel; |
| 280 | |
| 281 | for (unsigned i = Change.Tok->FakeRParens; i > 0 && ScopeStack.size(); --i) |
| 282 | if (ScopeStack.pop_back_val()) |
| 283 | --ConditionalsLevel; |
| 284 | } |
| 285 | } |
| 286 | |
| 287 | // Align a single sequence of tokens, see AlignTokens below. |
| 288 | // Column - The tokens indexed in Matches are moved to this column. |
| 289 | // RightJustify - Whether it is the token's right end or left end that gets |
| 290 | // moved to that column. |
| 291 | static void |
| 292 | AlignTokenSequence(const FormatStyle &Style, unsigned Start, unsigned End, |
| 293 | unsigned Column, bool RightJustify, |
| 294 | ArrayRef<unsigned> Matches, |
| 295 | SmallVector<WhitespaceManager::Change, 16> &Changes) { |
| 296 | unsigned OriginalMatchColumn = 0; |
| 297 | int Shift = 0; |
| 298 | // Set when the shift is applied anywhere in the line. Cleared when the line |
| 299 | // ends. |
| 300 | bool LineShifted = false; |
| 301 | |
| 302 | // ScopeStack keeps track of the current scope depth. It contains the levels |
| 303 | // of at most 2 scopes. The first one is the one that the matched token is |
| 304 | // in. The second one is the one that should not be moved by this procedure. |
| 305 | // The "Matches" indices should only have tokens from the outer-most scope. |
| 306 | // However, we do need to pay special attention to one class of tokens |
| 307 | // that are not in the outer-most scope, and that is the continuations of an |
| 308 | // unwrapped line whose positions are derived from a token to the right of the |
| 309 | // aligned token, as illustrated by this example: |
| 310 | // double a(int x); |
| 311 | // int b(int y, |
| 312 | // double z); |
| 313 | // In the above example, we need to take special care to ensure that |
| 314 | // 'double z' is indented along with its owning function 'b', because its |
| 315 | // position is derived from the '(' token to the right of the 'b' token. |
| 316 | // The same holds for calling a function: |
| 317 | // double a = foo(x); |
| 318 | // int b = bar(foo(y), |
| 319 | // foor(z)); |
| 320 | // Similar for broken string literals: |
| 321 | // double x = 3.14; |
| 322 | // auto s = "Hello" |
| 323 | // "World"; |
| 324 | // Special handling is required for 'nested' ternary operators. |
| 325 | SmallVector<std::tuple<unsigned, unsigned, unsigned>, 2> ScopeStack; |
| 326 | |
| 327 | for (unsigned i = Start; i != End; ++i) { |
| 328 | auto &CurrentChange = Changes[i]; |
| 329 | if (!Matches.empty() && Matches[0] < i) |
| 330 | Matches.consume_front(); |
| 331 | assert(Matches.empty() || Matches[0] >= i); |
| 332 | while (!ScopeStack.empty() && |
| 333 | CurrentChange.indentAndNestingLevel() < ScopeStack.back()) { |
| 334 | ScopeStack.pop_back(); |
| 335 | } |
| 336 | |
| 337 | // Keep track of the level that should not move with the aligned token. |
| 338 | if (ScopeStack.size() == 1u && CurrentChange.NewlinesBefore != 0u && |
| 339 | CurrentChange.indentAndNestingLevel() > ScopeStack[0] && |
| 340 | CurrentChange.IndentedFromColumn < OriginalMatchColumn) { |
| 341 | ScopeStack.push_back(Elt: CurrentChange.indentAndNestingLevel()); |
| 342 | } |
| 343 | |
| 344 | bool InsideNestedScope = |
| 345 | !ScopeStack.empty() && |
| 346 | (CurrentChange.indentAndNestingLevel() > ScopeStack[0] || |
| 347 | (CurrentChange.indentAndNestingLevel() == ScopeStack[0] && |
| 348 | CurrentChange.IndentedFromColumn >= OriginalMatchColumn)); |
| 349 | |
| 350 | if (CurrentChange.NewlinesBefore > 0) { |
| 351 | LineShifted = false; |
| 352 | if (!InsideNestedScope) |
| 353 | Shift = 0; |
| 354 | } |
| 355 | |
| 356 | // If this is the first matching token to be aligned, remember by how many |
| 357 | // spaces it has to be shifted, so the rest of the changes on the line are |
| 358 | // shifted by the same amount |
| 359 | if (!Matches.empty() && Matches[0] == i) { |
| 360 | OriginalMatchColumn = CurrentChange.StartOfTokenColumn; |
| 361 | Shift = Column - (RightJustify ? CurrentChange.TokenLength : 0) - |
| 362 | CurrentChange.StartOfTokenColumn; |
| 363 | ScopeStack = {CurrentChange.indentAndNestingLevel()}; |
| 364 | } |
| 365 | |
| 366 | if (Shift == 0) |
| 367 | continue; |
| 368 | |
| 369 | // This is for lines that are split across multiple lines, as mentioned in |
| 370 | // the ScopeStack comment. The stack size being 1 means that the token is |
| 371 | // not in a scope that should not move. |
| 372 | if ((!Matches.empty() && Matches[0] == i) || |
| 373 | (ScopeStack.size() == 1u && CurrentChange.NewlinesBefore > 0 && |
| 374 | InsideNestedScope)) { |
| 375 | LineShifted = true; |
| 376 | CurrentChange.IndentedFromColumn += Shift; |
| 377 | CurrentChange.Spaces += Shift; |
| 378 | } |
| 379 | |
| 380 | // We should not remove required spaces unless we break the line before. |
| 381 | assert(Shift > 0 || Changes[i].NewlinesBefore > 0 || |
| 382 | CurrentChange.Spaces >= |
| 383 | static_cast<int>(Changes[i].Tok->SpacesRequiredBefore) || |
| 384 | CurrentChange.Tok->is(tok::eof)); |
| 385 | |
| 386 | if (LineShifted) { |
| 387 | CurrentChange.StartOfTokenColumn += Shift; |
| 388 | if (i + 1 != Changes.size()) |
| 389 | Changes[i + 1].PreviousEndOfTokenColumn += Shift; |
| 390 | } |
| 391 | |
| 392 | // If PointerAlignment is PAS_Right, keep *s or &s next to the token, |
| 393 | // except if the token is equal, then a space is needed. |
| 394 | if ((Style.PointerAlignment == FormatStyle::PAS_Right || |
| 395 | Style.ReferenceAlignment == FormatStyle::RAS_Right) && |
| 396 | CurrentChange.Spaces != 0 && |
| 397 | CurrentChange.Tok->isNoneOf(Ks: tok::equal, Ks: tok::r_paren, |
| 398 | Ks: TT_TemplateCloser)) { |
| 399 | const bool ReferenceNotRightAligned = |
| 400 | Style.ReferenceAlignment != FormatStyle::RAS_Right && |
| 401 | Style.ReferenceAlignment != FormatStyle::RAS_Pointer; |
| 402 | for (int Previous = i - 1; |
| 403 | Previous >= 0 && Changes[Previous].Tok->is(TT: TT_PointerOrReference); |
| 404 | --Previous) { |
| 405 | assert(Changes[Previous].Tok->isPointerOrReference()); |
| 406 | if (Changes[Previous].Tok->isNot(Kind: tok::star)) { |
| 407 | if (ReferenceNotRightAligned) |
| 408 | continue; |
| 409 | } else if (Style.PointerAlignment != FormatStyle::PAS_Right) { |
| 410 | continue; |
| 411 | } |
| 412 | Changes[Previous + 1].Spaces -= Shift; |
| 413 | Changes[Previous].Spaces += Shift; |
| 414 | Changes[Previous].StartOfTokenColumn += Shift; |
| 415 | } |
| 416 | } |
| 417 | } |
| 418 | } |
| 419 | |
| 420 | // Walk through a subset of the changes, starting at StartAt, and find |
| 421 | // sequences of matching tokens to align. To do so, keep track of the lines and |
| 422 | // whether or not a matching token was found on a line. If a matching token is |
| 423 | // found, extend the current sequence. If the current line cannot be part of a |
| 424 | // sequence, e.g. because there is an empty line before it or it contains only |
| 425 | // non-matching tokens, finalize the previous sequence. |
| 426 | // The value returned is the token on which we stopped, either because we |
| 427 | // exhausted all items inside Changes, or because we hit a scope level higher |
| 428 | // than our initial scope. |
| 429 | // This function is recursive. Each invocation processes only the scope level |
| 430 | // equal to the initial level, which is the level of Changes[StartAt]. |
| 431 | // If we encounter a scope level greater than the initial level, then we call |
| 432 | // ourselves recursively, thereby avoiding the pollution of the current state |
| 433 | // with the alignment requirements of the nested sub-level. This recursive |
| 434 | // behavior is necessary for aligning function prototypes that have one or more |
| 435 | // arguments. |
| 436 | // If this function encounters a scope level less than the initial level, |
| 437 | // it returns the current position. |
| 438 | // There is a non-obvious subtlety in the recursive behavior: Even though we |
| 439 | // defer processing of nested levels to recursive invocations of this |
| 440 | // function, when it comes time to align a sequence of tokens, we run the |
| 441 | // alignment on the entire sequence, including the nested levels. |
| 442 | // When doing so, most of the nested tokens are skipped, because their |
| 443 | // alignment was already handled by the recursive invocations of this function. |
| 444 | // However, the special exception is that we do NOT skip function parameters |
| 445 | // that are split across multiple lines. See the test case in FormatTest.cpp |
| 446 | // that mentions "split function parameter alignment" for an example of this. |
| 447 | // When the parameter RightJustify is true, the operator will be |
| 448 | // right-justified. It is used to align compound assignments like `+=` and `=`. |
| 449 | // When RightJustify and ACS.PadOperators are true, operators in each block to |
| 450 | // be aligned will be padded on the left to the same length before aligning. |
| 451 | // |
| 452 | // The simple check will not look at the indentaion and nesting level to recurse |
| 453 | // into the line for alignment. It will also not count the commas. This is e.g. |
| 454 | // for aligning macro definitions. |
| 455 | template <typename F, bool SimpleCheck = false> |
| 456 | static unsigned AlignTokens(const FormatStyle &Style, F &&Matches, |
| 457 | SmallVector<WhitespaceManager::Change, 16> &Changes, |
| 458 | unsigned StartAt, |
| 459 | const FormatStyle::AlignConsecutiveStyle &ACS = {}, |
| 460 | bool RightJustify = false) { |
| 461 | // We arrange each line in 3 parts. The operator to be aligned (the anchor), |
| 462 | // and text to its left and right. In the aligned text the width of each part |
| 463 | // will be the maximum of that over the block that has been aligned. |
| 464 | |
| 465 | // Maximum widths of each part so far. |
| 466 | // When RightJustify is true and ACS.PadOperators is false, the part from |
| 467 | // start of line to the right end of the anchor. Otherwise, only the part to |
| 468 | // the left of the anchor. Including the space that exists on its left from |
| 469 | // the start. Not including the padding added on the left to right-justify the |
| 470 | // anchor. |
| 471 | unsigned WidthLeft = 0; |
| 472 | // The operator to be aligned when RightJustify is true and ACS.PadOperators |
| 473 | // is false. 0 otherwise. |
| 474 | unsigned WidthAnchor = 0; |
| 475 | // Width to the right of the anchor. Plus width of the anchor when |
| 476 | // RightJustify is false. |
| 477 | unsigned WidthRight = 0; |
| 478 | |
| 479 | // Number of the start and the end of the current token sequence. |
| 480 | unsigned StartOfSequence = 0; |
| 481 | unsigned EndOfSequence = 0; |
| 482 | |
| 483 | // The positions of the tokens to be aligned. |
| 484 | SmallVector<unsigned> MatchedIndices; |
| 485 | |
| 486 | // Measure the scope level (i.e. depth of (), [], {}) of the first token, and |
| 487 | // abort when we hit any token in a higher scope than the starting one. |
| 488 | const auto IndentAndNestingLevel = |
| 489 | StartAt < Changes.size() ? Changes[StartAt].indentAndNestingLevel() |
| 490 | : std::tuple<unsigned, unsigned, unsigned>(); |
| 491 | |
| 492 | // Keep track of the number of commas before the matching tokens, we will only |
| 493 | // align a sequence of matching tokens if they are preceded by the same number |
| 494 | // of commas. |
| 495 | unsigned CommasBeforeLastMatch = 0; |
| 496 | unsigned CommasBeforeMatch = 0; |
| 497 | |
| 498 | // The column number of the matching token on the current line. |
| 499 | std::optional<unsigned> MatchingColumn; |
| 500 | |
| 501 | // Whether the current line consists purely of comments. |
| 502 | bool = true; |
| 503 | |
| 504 | // Aligns a sequence of matching tokens, on the MinColumn column. |
| 505 | // |
| 506 | // Sequences start from the first matching token to align, and end at the |
| 507 | // first token of the first line that doesn't need to be aligned. |
| 508 | // |
| 509 | // We need to adjust the StartOfTokenColumn of each Change that is on a line |
| 510 | // containing any matching token to be aligned and located after such token. |
| 511 | auto AlignCurrentSequence = [&] { |
| 512 | if (StartOfSequence > 0 && StartOfSequence < EndOfSequence) { |
| 513 | AlignTokenSequence(Style, Start: StartOfSequence, End: EndOfSequence, |
| 514 | Column: WidthLeft + WidthAnchor, RightJustify, Matches: MatchedIndices, |
| 515 | Changes); |
| 516 | } |
| 517 | WidthLeft = 0; |
| 518 | WidthAnchor = 0; |
| 519 | WidthRight = 0; |
| 520 | StartOfSequence = 0; |
| 521 | EndOfSequence = 0; |
| 522 | MatchedIndices.clear(); |
| 523 | }; |
| 524 | |
| 525 | unsigned I = StartAt; |
| 526 | const auto E = Changes.size(); |
| 527 | for (; I != E; ++I) { |
| 528 | auto &CurrentChange = Changes[I]; |
| 529 | if (CurrentChange.indentAndNestingLevel() < IndentAndNestingLevel) |
| 530 | break; |
| 531 | |
| 532 | if (CurrentChange.NewlinesBefore != 0) { |
| 533 | CommasBeforeMatch = 0; |
| 534 | EndOfSequence = I; |
| 535 | |
| 536 | // Whether to break the alignment sequence because of an empty line. |
| 537 | bool EmptyLineBreak = |
| 538 | (CurrentChange.NewlinesBefore > 1) && !ACS.AcrossEmptyLines; |
| 539 | |
| 540 | // Whether to break the alignment sequence because of a line without a |
| 541 | // match. |
| 542 | bool NoMatchBreak = |
| 543 | !MatchingColumn && !(LineIsComment && ACS.AcrossComments); |
| 544 | |
| 545 | if (EmptyLineBreak || NoMatchBreak) |
| 546 | AlignCurrentSequence(); |
| 547 | |
| 548 | // A new line starts, re-initialize line status tracking bools. |
| 549 | // Keep the match state if a string literal is continued on this line. |
| 550 | if (MatchingColumn && CurrentChange.IndentedFromColumn < *MatchingColumn) |
| 551 | MatchingColumn.reset(); |
| 552 | LineIsComment = true; |
| 553 | } |
| 554 | |
| 555 | if (CurrentChange.Tok->isNot(Kind: tok::comment)) |
| 556 | LineIsComment = false; |
| 557 | |
| 558 | if (!SimpleCheck) { |
| 559 | if (CurrentChange.Tok->is(Kind: tok::comma)) { |
| 560 | ++CommasBeforeMatch; |
| 561 | } else if (CurrentChange.indentAndNestingLevel() > |
| 562 | IndentAndNestingLevel) { |
| 563 | // Call AlignTokens recursively, skipping over this scope block. |
| 564 | const auto StoppedAt = |
| 565 | AlignTokens(Style, Matches, Changes, I, ACS, RightJustify); |
| 566 | I = StoppedAt - 1; |
| 567 | continue; |
| 568 | } |
| 569 | } |
| 570 | |
| 571 | if (!Matches(CurrentChange)) |
| 572 | continue; |
| 573 | |
| 574 | // If there is more than one matching token per line, or if the number of |
| 575 | // preceding commas, do not match anymore, end the sequence. |
| 576 | if ((CurrentChange.NewlinesBefore == 0U && MatchingColumn) || |
| 577 | CommasBeforeMatch != CommasBeforeLastMatch) { |
| 578 | MatchedIndices.push_back(Elt: I); |
| 579 | AlignCurrentSequence(); |
| 580 | } |
| 581 | |
| 582 | CommasBeforeLastMatch = CommasBeforeMatch; |
| 583 | MatchingColumn = CurrentChange.StartOfTokenColumn; |
| 584 | |
| 585 | if (StartOfSequence == 0) |
| 586 | StartOfSequence = I; |
| 587 | |
| 588 | unsigned ChangeWidthLeft = CurrentChange.StartOfTokenColumn; |
| 589 | unsigned ChangeWidthAnchor = 0; |
| 590 | unsigned ChangeWidthRight = 0; |
| 591 | unsigned CurrentChangeWidthRight = 0; |
| 592 | if (RightJustify) |
| 593 | if (ACS.PadOperators) |
| 594 | ChangeWidthAnchor = CurrentChange.TokenLength; |
| 595 | else |
| 596 | ChangeWidthLeft += CurrentChange.TokenLength; |
| 597 | else |
| 598 | CurrentChangeWidthRight = CurrentChange.TokenLength; |
| 599 | const FormatToken *MatchingParenToEncounter = nullptr; |
| 600 | for (unsigned J = I + 1; |
| 601 | J != E && (Changes[J].NewlinesBefore == 0 || |
| 602 | MatchingParenToEncounter || Changes[J].IsAligned); |
| 603 | ++J) { |
| 604 | const auto &Change = Changes[J]; |
| 605 | const auto *Tok = Change.Tok; |
| 606 | |
| 607 | if (Tok->MatchingParen) { |
| 608 | if (Tok->isOneOf(K1: tok::l_paren, K2: tok::l_brace, Ks: tok::l_square, |
| 609 | Ks: TT_TemplateOpener) && |
| 610 | !MatchingParenToEncounter) { |
| 611 | // If the next token is on the next line, we probably don't need to |
| 612 | // check the following lengths, because it most likely isn't aligned |
| 613 | // with the rest. |
| 614 | if (J + 1 != E && Changes[J + 1].NewlinesBefore == 0) |
| 615 | MatchingParenToEncounter = Tok->MatchingParen; |
| 616 | } else if (MatchingParenToEncounter == Tok->MatchingParen) { |
| 617 | MatchingParenToEncounter = nullptr; |
| 618 | } |
| 619 | } |
| 620 | |
| 621 | if (Change.NewlinesBefore != 0) { |
| 622 | ChangeWidthRight = std::max(a: ChangeWidthRight, b: CurrentChangeWidthRight); |
| 623 | const auto ChangeWidthStart = ChangeWidthLeft + ChangeWidthAnchor; |
| 624 | // If the position of the current token is columnwise before the begin |
| 625 | // of the alignment, we drop out here, because the next line does not |
| 626 | // have to be moved with the previous one(s) for the alignment. E.g.: |
| 627 | // int i1 = 1; | <- ColumnLimit | int i1 = 1; |
| 628 | // int j = 0; | Without the break -> | int j = 0; |
| 629 | // int k = bar( | We still want to align the = | int k = bar( |
| 630 | // argument1, | here, even if we can't move | argument1, |
| 631 | // argument2); | the following lines. | argument2); |
| 632 | if (Change.IndentedFromColumn < ChangeWidthStart) |
| 633 | break; |
| 634 | CurrentChangeWidthRight = Change.Spaces - ChangeWidthStart; |
| 635 | } else { |
| 636 | CurrentChangeWidthRight += Change.Spaces; |
| 637 | } |
| 638 | |
| 639 | // Changes are generally 1:1 with the tokens, but a change could also be |
| 640 | // inside of a token, in which case it's counted more than once: once for |
| 641 | // the whitespace surrounding the token (!IsInsideToken) and once for |
| 642 | // each whitespace change within it (IsInsideToken). |
| 643 | // Therefore, changes inside of a token should only count the space. |
| 644 | if (!Change.IsInsideToken) |
| 645 | CurrentChangeWidthRight += Change.TokenLength; |
| 646 | } |
| 647 | |
| 648 | ChangeWidthRight = std::max(a: ChangeWidthRight, b: CurrentChangeWidthRight); |
| 649 | |
| 650 | // If we are restricted by the maximum column width, end the sequence. |
| 651 | unsigned NewLeft = std::max(a: ChangeWidthLeft, b: WidthLeft); |
| 652 | unsigned NewAnchor = std::max(a: ChangeWidthAnchor, b: WidthAnchor); |
| 653 | unsigned NewRight = std::max(a: ChangeWidthRight, b: WidthRight); |
| 654 | // `ColumnLimit == 0` means there is no column limit. |
| 655 | if (Style.ColumnLimit != 0 && |
| 656 | Style.ColumnLimit < NewLeft + NewAnchor + NewRight) { |
| 657 | AlignCurrentSequence(); |
| 658 | StartOfSequence = I; |
| 659 | WidthLeft = ChangeWidthLeft; |
| 660 | WidthAnchor = ChangeWidthAnchor; |
| 661 | WidthRight = ChangeWidthRight; |
| 662 | } else { |
| 663 | WidthLeft = NewLeft; |
| 664 | WidthAnchor = NewAnchor; |
| 665 | WidthRight = NewRight; |
| 666 | } |
| 667 | MatchedIndices.push_back(Elt: I); |
| 668 | } |
| 669 | |
| 670 | // Pass entire lines to the function so that it can update the state of all |
| 671 | // tokens that move. |
| 672 | for (EndOfSequence = I; |
| 673 | EndOfSequence < E && Changes[EndOfSequence].NewlinesBefore == 0; |
| 674 | ++EndOfSequence) { |
| 675 | } |
| 676 | AlignCurrentSequence(); |
| 677 | // The return value should still be where the level ends. The rest of the line |
| 678 | // may contain stuff to be aligned within an outer level. |
| 679 | return I; |
| 680 | } |
| 681 | |
| 682 | // Aligns a sequence of matching tokens, on the MinColumn column. |
| 683 | // |
| 684 | // Sequences start from the first matching token to align, and end at the |
| 685 | // first token of the first line that doesn't need to be aligned. |
| 686 | // |
| 687 | // We need to adjust the StartOfTokenColumn of each Change that is on a line |
| 688 | // containing any matching token to be aligned and located after such token. |
| 689 | static void AlignMatchingTokenSequence( |
| 690 | unsigned &StartOfSequence, unsigned &EndOfSequence, unsigned &MinColumn, |
| 691 | std::function<bool(const WhitespaceManager::Change &C)> Matches, |
| 692 | SmallVector<WhitespaceManager::Change, 16> &Changes) { |
| 693 | if (StartOfSequence > 0 && StartOfSequence < EndOfSequence) { |
| 694 | bool FoundMatchOnLine = false; |
| 695 | int Shift = 0; |
| 696 | |
| 697 | for (unsigned I = StartOfSequence; I != EndOfSequence; ++I) { |
| 698 | if (Changes[I].NewlinesBefore > 0) { |
| 699 | Shift = 0; |
| 700 | FoundMatchOnLine = false; |
| 701 | } |
| 702 | |
| 703 | // If this is the first matching token to be aligned, remember by how many |
| 704 | // spaces it has to be shifted, so the rest of the changes on the line are |
| 705 | // shifted by the same amount. |
| 706 | if (!FoundMatchOnLine && Matches(Changes[I])) { |
| 707 | FoundMatchOnLine = true; |
| 708 | Shift = MinColumn - Changes[I].StartOfTokenColumn; |
| 709 | Changes[I].Spaces += Shift; |
| 710 | } |
| 711 | |
| 712 | assert(Shift >= 0); |
| 713 | Changes[I].StartOfTokenColumn += Shift; |
| 714 | if (I + 1 != Changes.size()) |
| 715 | Changes[I + 1].PreviousEndOfTokenColumn += Shift; |
| 716 | } |
| 717 | } |
| 718 | |
| 719 | MinColumn = 0; |
| 720 | StartOfSequence = 0; |
| 721 | EndOfSequence = 0; |
| 722 | } |
| 723 | |
| 724 | void WhitespaceManager::alignConsecutiveMacros() { |
| 725 | if (!Style.AlignConsecutiveMacros.Enabled) |
| 726 | return; |
| 727 | |
| 728 | auto AlignMacrosMatches = [](const Change &C) { |
| 729 | const FormatToken *Current = C.Tok; |
| 730 | assert(Current); |
| 731 | |
| 732 | if (Current->SpacesRequiredBefore == 0 || !Current->Previous) |
| 733 | return false; |
| 734 | |
| 735 | Current = Current->Previous; |
| 736 | |
| 737 | // If token is a ")", skip over the parameter list, to the |
| 738 | // token that precedes the "(" |
| 739 | if (Current->is(Kind: tok::r_paren)) { |
| 740 | const auto *MatchingParen = Current->MatchingParen; |
| 741 | // For a macro function, 0 spaces are required between the |
| 742 | // identifier and the lparen that opens the parameter list. |
| 743 | if (!MatchingParen || MatchingParen->SpacesRequiredBefore > 0 || |
| 744 | !MatchingParen->Previous) { |
| 745 | return false; |
| 746 | } |
| 747 | Current = MatchingParen->Previous; |
| 748 | } else if (Current->Next->SpacesRequiredBefore != 1) { |
| 749 | // For a simple macro, 1 space is required between the |
| 750 | // identifier and the first token of the defined value. |
| 751 | return false; |
| 752 | } |
| 753 | |
| 754 | return Current->endsSequence(K1: tok::identifier, Tokens: tok::pp_define); |
| 755 | }; |
| 756 | |
| 757 | AlignTokens<decltype(AlignMacrosMatches) &, /*SimpleCheck=*/true>( |
| 758 | Style, Matches&: AlignMacrosMatches, Changes, StartAt: 0, ACS: Style.AlignConsecutiveMacros); |
| 759 | } |
| 760 | |
| 761 | void WhitespaceManager::alignConsecutiveAssignments() { |
| 762 | if (!Style.AlignConsecutiveAssignments.Enabled) |
| 763 | return; |
| 764 | |
| 765 | AlignTokens( |
| 766 | Style, |
| 767 | Matches: [&](const Change &C) { |
| 768 | // Do not align on equal signs that are first on a line. |
| 769 | if (C.NewlinesBefore > 0) |
| 770 | return false; |
| 771 | |
| 772 | // Do not align on equal signs that are last on a line. |
| 773 | if (&C != &Changes.back() && (&C + 1)->NewlinesBefore > 0) |
| 774 | return false; |
| 775 | |
| 776 | // Do not align operator= overloads. |
| 777 | FormatToken *Previous = C.Tok->getPreviousNonComment(); |
| 778 | if (Previous && Previous->is(Kind: tok::kw_operator)) |
| 779 | return false; |
| 780 | |
| 781 | return Style.AlignConsecutiveAssignments.AlignCompound |
| 782 | ? C.Tok->getPrecedence() == prec::Assignment |
| 783 | : (C.Tok->is(Kind: tok::equal) || |
| 784 | // In Verilog the '<=' is not a compound assignment, thus |
| 785 | // it is aligned even when the AlignCompound option is not |
| 786 | // set. |
| 787 | (Style.isVerilog() && C.Tok->is(Kind: tok::lessequal) && |
| 788 | C.Tok->getPrecedence() == prec::Assignment)); |
| 789 | }, |
| 790 | Changes, /*StartAt=*/0, ACS: Style.AlignConsecutiveAssignments, |
| 791 | /*RightJustify=*/true); |
| 792 | } |
| 793 | |
| 794 | void WhitespaceManager::alignConsecutiveBitFields() { |
| 795 | alignConsecutiveColons(AlignStyle: Style.AlignConsecutiveBitFields, Type: TT_BitFieldColon); |
| 796 | } |
| 797 | |
| 798 | void WhitespaceManager::alignConsecutiveColons( |
| 799 | const FormatStyle::AlignConsecutiveStyle &AlignStyle, TokenType Type) { |
| 800 | if (!AlignStyle.Enabled) |
| 801 | return; |
| 802 | |
| 803 | AlignTokens( |
| 804 | Style, |
| 805 | Matches: [&](Change const &C) { |
| 806 | // Do not align on ':' that is first on a line. |
| 807 | if (C.NewlinesBefore > 0) |
| 808 | return false; |
| 809 | |
| 810 | // Do not align on ':' that is last on a line. |
| 811 | if (&C != &Changes.back() && (&C + 1)->NewlinesBefore > 0) |
| 812 | return false; |
| 813 | |
| 814 | return C.Tok->is(TT: Type); |
| 815 | }, |
| 816 | Changes, /*StartAt=*/0, ACS: AlignStyle); |
| 817 | } |
| 818 | |
| 819 | void WhitespaceManager::alignConsecutiveShortCaseStatements(bool IsExpr) { |
| 820 | if (!Style.AlignConsecutiveShortCaseStatements.Enabled || |
| 821 | !(IsExpr ? Style.AllowShortCaseExpressionOnASingleLine |
| 822 | : Style.AllowShortCaseLabelsOnASingleLine)) { |
| 823 | return; |
| 824 | } |
| 825 | |
| 826 | const auto Type = IsExpr ? TT_CaseLabelArrow : TT_CaseLabelColon; |
| 827 | const auto &Option = Style.AlignConsecutiveShortCaseStatements; |
| 828 | const bool AlignArrowOrColon = |
| 829 | IsExpr ? Option.AlignCaseArrows : Option.AlignCaseColons; |
| 830 | |
| 831 | auto Matches = [&](const Change &C) { |
| 832 | if (AlignArrowOrColon) |
| 833 | return C.Tok->is(TT: Type); |
| 834 | |
| 835 | // Ignore 'IsInsideToken' to allow matching trailing comments which |
| 836 | // need to be reflowed as that causes the token to appear in two |
| 837 | // different changes, which will cause incorrect alignment as we'll |
| 838 | // reflow early due to detecting multiple aligning tokens per line. |
| 839 | return !C.IsInsideToken && C.Tok->Previous && C.Tok->Previous->is(TT: Type); |
| 840 | }; |
| 841 | |
| 842 | unsigned MinColumn = 0; |
| 843 | |
| 844 | // Empty case statements don't break the alignment, but don't necessarily |
| 845 | // match our predicate, so we need to track their column so they can push out |
| 846 | // our alignment. |
| 847 | unsigned MinEmptyCaseColumn = 0; |
| 848 | |
| 849 | // Start and end of the token sequence we're processing. |
| 850 | unsigned StartOfSequence = 0; |
| 851 | unsigned EndOfSequence = 0; |
| 852 | |
| 853 | // Whether a matching token has been found on the current line. |
| 854 | bool FoundMatchOnLine = false; |
| 855 | |
| 856 | bool = true; |
| 857 | bool LineIsEmptyCase = false; |
| 858 | |
| 859 | unsigned I = 0; |
| 860 | for (unsigned E = Changes.size(); I != E; ++I) { |
| 861 | if (Changes[I].NewlinesBefore != 0) { |
| 862 | // Whether to break the alignment sequence because of an empty line. |
| 863 | bool EmptyLineBreak = |
| 864 | (Changes[I].NewlinesBefore > 1) && |
| 865 | !Style.AlignConsecutiveShortCaseStatements.AcrossEmptyLines; |
| 866 | |
| 867 | // Whether to break the alignment sequence because of a line without a |
| 868 | // match. |
| 869 | bool NoMatchBreak = |
| 870 | !FoundMatchOnLine && |
| 871 | !(LineIsComment && |
| 872 | Style.AlignConsecutiveShortCaseStatements.AcrossComments) && |
| 873 | !LineIsEmptyCase; |
| 874 | |
| 875 | if (EmptyLineBreak || NoMatchBreak) { |
| 876 | AlignMatchingTokenSequence(StartOfSequence, EndOfSequence, MinColumn, |
| 877 | Matches, Changes); |
| 878 | MinEmptyCaseColumn = 0; |
| 879 | } |
| 880 | |
| 881 | // A new line starts, re-initialize line status tracking bools. |
| 882 | FoundMatchOnLine = false; |
| 883 | LineIsComment = true; |
| 884 | LineIsEmptyCase = false; |
| 885 | } |
| 886 | |
| 887 | if (Changes[I].Tok->isNot(Kind: tok::comment)) |
| 888 | LineIsComment = false; |
| 889 | |
| 890 | if (Changes[I].Tok->is(TT: Type)) { |
| 891 | LineIsEmptyCase = |
| 892 | !Changes[I].Tok->Next || Changes[I].Tok->Next->isTrailingComment(); |
| 893 | |
| 894 | if (LineIsEmptyCase) { |
| 895 | if (Style.AlignConsecutiveShortCaseStatements.AlignCaseColons) { |
| 896 | MinEmptyCaseColumn = |
| 897 | std::max(a: MinEmptyCaseColumn, b: Changes[I].StartOfTokenColumn); |
| 898 | } else { |
| 899 | MinEmptyCaseColumn = |
| 900 | std::max(a: MinEmptyCaseColumn, b: Changes[I].StartOfTokenColumn + 2); |
| 901 | } |
| 902 | } |
| 903 | } |
| 904 | |
| 905 | if (!Matches(Changes[I])) |
| 906 | continue; |
| 907 | |
| 908 | if (LineIsEmptyCase) |
| 909 | continue; |
| 910 | |
| 911 | FoundMatchOnLine = true; |
| 912 | |
| 913 | if (StartOfSequence == 0) |
| 914 | StartOfSequence = I; |
| 915 | |
| 916 | EndOfSequence = I + 1; |
| 917 | |
| 918 | MinColumn = std::max(a: MinColumn, b: Changes[I].StartOfTokenColumn); |
| 919 | |
| 920 | // Allow empty case statements to push out our alignment. |
| 921 | MinColumn = std::max(a: MinColumn, b: MinEmptyCaseColumn); |
| 922 | } |
| 923 | |
| 924 | AlignMatchingTokenSequence(StartOfSequence, EndOfSequence, MinColumn, Matches, |
| 925 | Changes); |
| 926 | } |
| 927 | |
| 928 | void WhitespaceManager::alignConsecutiveTableGenBreakingDAGArgColons() { |
| 929 | alignConsecutiveColons(AlignStyle: Style.AlignConsecutiveTableGenBreakingDAGArgColons, |
| 930 | Type: TT_TableGenDAGArgListColonToAlign); |
| 931 | } |
| 932 | |
| 933 | void WhitespaceManager::alignConsecutiveTableGenCondOperatorColons() { |
| 934 | alignConsecutiveColons(AlignStyle: Style.AlignConsecutiveTableGenCondOperatorColons, |
| 935 | Type: TT_TableGenCondOperatorColon); |
| 936 | } |
| 937 | |
| 938 | void WhitespaceManager::alignConsecutiveTableGenDefinitions() { |
| 939 | alignConsecutiveColons(AlignStyle: Style.AlignConsecutiveTableGenDefinitionColons, |
| 940 | Type: TT_InheritanceColon); |
| 941 | } |
| 942 | |
| 943 | void WhitespaceManager::alignConsecutiveDeclarations() { |
| 944 | if (!Style.AlignConsecutiveDeclarations.Enabled) |
| 945 | return; |
| 946 | |
| 947 | AlignTokens( |
| 948 | Style, |
| 949 | Matches: [&](Change const &C) { |
| 950 | if (C.Tok->is(TT: TT_FunctionTypeLParen)) |
| 951 | return Style.AlignConsecutiveDeclarations.AlignFunctionPointers; |
| 952 | if (C.Tok->is(TT: TT_FunctionDeclarationName)) |
| 953 | return Style.AlignConsecutiveDeclarations.AlignFunctionDeclarations; |
| 954 | if (C.Tok->isNot(Kind: TT_StartOfName)) |
| 955 | return false; |
| 956 | if (C.Tok->Previous && |
| 957 | C.Tok->Previous->is(TT: TT_StatementAttributeLikeMacro)) |
| 958 | return false; |
| 959 | // Check if there is a subsequent name that starts the same declaration. |
| 960 | for (FormatToken *Next = C.Tok->Next; Next; Next = Next->Next) { |
| 961 | if (Next->is(Kind: tok::comment)) |
| 962 | continue; |
| 963 | if (Next->is(TT: TT_PointerOrReference)) |
| 964 | return false; |
| 965 | if (!Next->Tok.getIdentifierInfo()) |
| 966 | break; |
| 967 | if (Next->isOneOf(K1: TT_StartOfName, K2: TT_FunctionDeclarationName, |
| 968 | Ks: tok::kw_operator)) { |
| 969 | return false; |
| 970 | } |
| 971 | } |
| 972 | return true; |
| 973 | }, |
| 974 | Changes, /*StartAt=*/0, ACS: Style.AlignConsecutiveDeclarations); |
| 975 | } |
| 976 | |
| 977 | void WhitespaceManager::alignChainedConditionals() { |
| 978 | if (Style.BreakBeforeTernaryOperators) { |
| 979 | AlignTokens( |
| 980 | Style, |
| 981 | Matches: [](Change const &C) { |
| 982 | // Align question operators and last colon |
| 983 | return C.Tok->is(TT: TT_ConditionalExpr) && |
| 984 | ((C.Tok->is(Kind: tok::question) && !C.NewlinesBefore) || |
| 985 | (C.Tok->is(Kind: tok::colon) && C.Tok->Next && |
| 986 | (C.Tok->Next->FakeLParens.empty() || |
| 987 | C.Tok->Next->FakeLParens.back() != prec::Conditional))); |
| 988 | }, |
| 989 | Changes, /*StartAt=*/0); |
| 990 | } else { |
| 991 | static auto AlignWrappedOperand = [](Change const &C) { |
| 992 | FormatToken *Previous = C.Tok->getPreviousNonComment(); |
| 993 | return C.NewlinesBefore && Previous && Previous->is(TT: TT_ConditionalExpr) && |
| 994 | (Previous->is(Kind: tok::colon) && |
| 995 | (C.Tok->FakeLParens.empty() || |
| 996 | C.Tok->FakeLParens.back() != prec::Conditional)); |
| 997 | }; |
| 998 | // Ensure we keep alignment of wrapped operands with non-wrapped operands |
| 999 | // Since we actually align the operators, the wrapped operands need the |
| 1000 | // extra offset to be properly aligned. |
| 1001 | for (Change &C : Changes) |
| 1002 | if (AlignWrappedOperand(C)) |
| 1003 | C.StartOfTokenColumn -= 2; |
| 1004 | AlignTokens( |
| 1005 | Style, |
| 1006 | Matches: [this](Change const &C) { |
| 1007 | // Align question operators if next operand is not wrapped, as |
| 1008 | // well as wrapped operands after question operator or last |
| 1009 | // colon in conditional sequence |
| 1010 | return (C.Tok->is(TT: TT_ConditionalExpr) && C.Tok->is(Kind: tok::question) && |
| 1011 | &C != &Changes.back() && (&C + 1)->NewlinesBefore == 0 && |
| 1012 | !(&C + 1)->IsTrailingComment) || |
| 1013 | AlignWrappedOperand(C); |
| 1014 | }, |
| 1015 | Changes, /*StartAt=*/0); |
| 1016 | } |
| 1017 | } |
| 1018 | |
| 1019 | void WhitespaceManager::() { |
| 1020 | if (Style.AlignTrailingComments.Kind == FormatStyle::TCAS_Never) |
| 1021 | return; |
| 1022 | |
| 1023 | const int Size = Changes.size(); |
| 1024 | if (Size == 0) |
| 1025 | return; |
| 1026 | |
| 1027 | int MinColumn = 0; |
| 1028 | int StartOfSequence = 0; |
| 1029 | bool BreakBeforeNext = false; |
| 1030 | bool IsInPP = Changes.front().Tok->Tok.is(K: tok::hash); |
| 1031 | int NewLineThreshold = 1; |
| 1032 | if (Style.AlignTrailingComments.Kind == FormatStyle::TCAS_Always) |
| 1033 | NewLineThreshold = Style.AlignTrailingComments.OverEmptyLines + 1; |
| 1034 | |
| 1035 | for (int I = 0, MaxColumn = INT_MAX, Newlines = 0; I < Size; ++I) { |
| 1036 | auto &C = Changes[I]; |
| 1037 | if (C.StartOfBlockComment) |
| 1038 | continue; |
| 1039 | if (C.NewlinesBefore != 0) { |
| 1040 | Newlines += C.NewlinesBefore; |
| 1041 | const bool WasInPP = std::exchange( |
| 1042 | obj&: IsInPP, new_val: C.Tok->Tok.is(K: tok::hash) || (IsInPP && C.IsTrailingComment) || |
| 1043 | C.ContinuesPPDirective); |
| 1044 | if (IsInPP != WasInPP && !Style.AlignTrailingComments.AlignPPAndNotPP) { |
| 1045 | alignTrailingComments(Start: StartOfSequence, End: I, Column: MinColumn); |
| 1046 | MinColumn = 0; |
| 1047 | MaxColumn = INT_MAX; |
| 1048 | StartOfSequence = I; |
| 1049 | Newlines = 0; |
| 1050 | } |
| 1051 | } |
| 1052 | if (!C.IsTrailingComment) |
| 1053 | continue; |
| 1054 | |
| 1055 | if (Style.AlignTrailingComments.Kind == FormatStyle::TCAS_Leave) { |
| 1056 | const int OriginalSpaces = |
| 1057 | C.OriginalWhitespaceRange.getEnd().getRawEncoding() - |
| 1058 | C.OriginalWhitespaceRange.getBegin().getRawEncoding() - |
| 1059 | C.Tok->LastNewlineOffset; |
| 1060 | assert(OriginalSpaces >= 0); |
| 1061 | const auto RestoredLineLength = |
| 1062 | C.StartOfTokenColumn + C.TokenLength + OriginalSpaces; |
| 1063 | // If leaving comments makes the line exceed the column limit, give up to |
| 1064 | // leave the comments. |
| 1065 | if (RestoredLineLength >= Style.ColumnLimit && Style.ColumnLimit > 0) |
| 1066 | break; |
| 1067 | C.Spaces = C.NewlinesBefore > 0 ? C.Tok->OriginalColumn : OriginalSpaces; |
| 1068 | continue; |
| 1069 | } |
| 1070 | |
| 1071 | const int ChangeMinColumn = C.StartOfTokenColumn; |
| 1072 | int ChangeMaxColumn; |
| 1073 | |
| 1074 | // If we don't create a replacement for this change, we have to consider |
| 1075 | // it to be immovable. |
| 1076 | if (!C.CreateReplacement) |
| 1077 | ChangeMaxColumn = ChangeMinColumn; |
| 1078 | else if (Style.ColumnLimit == 0) |
| 1079 | ChangeMaxColumn = INT_MAX; |
| 1080 | else if (Style.ColumnLimit >= C.TokenLength) |
| 1081 | ChangeMaxColumn = Style.ColumnLimit - C.TokenLength; |
| 1082 | else |
| 1083 | ChangeMaxColumn = ChangeMinColumn; |
| 1084 | |
| 1085 | if (I + 1 < Size && Changes[I + 1].ContinuesPPDirective && |
| 1086 | ChangeMaxColumn >= 2) { |
| 1087 | ChangeMaxColumn -= 2; |
| 1088 | } |
| 1089 | |
| 1090 | bool WasAlignedWithStartOfNextLine = false; |
| 1091 | if (C.NewlinesBefore >= 1) { // A comment on its own line. |
| 1092 | const auto CommentColumn = |
| 1093 | SourceMgr.getSpellingColumnNumber(Loc: C.OriginalWhitespaceRange.getEnd()); |
| 1094 | for (int J = I + 1; J < Size; ++J) { |
| 1095 | if (Changes[J].Tok->is(Kind: tok::comment)) |
| 1096 | continue; |
| 1097 | |
| 1098 | const auto NextColumn = SourceMgr.getSpellingColumnNumber( |
| 1099 | Loc: Changes[J].OriginalWhitespaceRange.getEnd()); |
| 1100 | // The start of the next token was previously aligned with the |
| 1101 | // start of this comment. |
| 1102 | WasAlignedWithStartOfNextLine = |
| 1103 | CommentColumn == NextColumn || |
| 1104 | CommentColumn == NextColumn + Style.IndentWidth; |
| 1105 | break; |
| 1106 | } |
| 1107 | } |
| 1108 | |
| 1109 | // We don't want to align comments which end a scope, which are here |
| 1110 | // identified by most closing braces. |
| 1111 | auto = [](const auto *Tok) { |
| 1112 | if (Tok->is(tok::semi)) { |
| 1113 | Tok = Tok->getPreviousNonComment(); |
| 1114 | if (!Tok) |
| 1115 | return false; |
| 1116 | } |
| 1117 | if (Tok->is(tok::r_paren)) { |
| 1118 | // Back up past the parentheses and a `TT_DoWhile` that may precede. |
| 1119 | Tok = Tok->MatchingParen; |
| 1120 | if (!Tok) |
| 1121 | return false; |
| 1122 | Tok = Tok->getPreviousNonComment(); |
| 1123 | if (!Tok) |
| 1124 | return false; |
| 1125 | if (Tok->is(TT_DoWhile)) { |
| 1126 | const auto *Prev = Tok->getPreviousNonComment(); |
| 1127 | if (!Prev) { |
| 1128 | // A do-while-loop without braces. |
| 1129 | return true; |
| 1130 | } |
| 1131 | Tok = Prev; |
| 1132 | } |
| 1133 | } |
| 1134 | |
| 1135 | if (Tok->isNot(tok::r_brace)) |
| 1136 | return false; |
| 1137 | |
| 1138 | while (Tok->Previous && Tok->Previous->is(tok::r_brace)) |
| 1139 | Tok = Tok->Previous; |
| 1140 | return Tok->NewlinesBefore > 0; |
| 1141 | }; |
| 1142 | |
| 1143 | if (I > 0 && C.NewlinesBefore == 0 && |
| 1144 | DontAlignThisComment(Changes[I - 1].Tok)) { |
| 1145 | alignTrailingComments(Start: StartOfSequence, End: I, Column: MinColumn); |
| 1146 | // Reset to initial values, but skip this change for the next alignment |
| 1147 | // pass. |
| 1148 | MinColumn = 0; |
| 1149 | MaxColumn = INT_MAX; |
| 1150 | StartOfSequence = I + 1; |
| 1151 | } else if (BreakBeforeNext || Newlines > NewLineThreshold || |
| 1152 | (ChangeMinColumn > MaxColumn || ChangeMaxColumn < MinColumn) || |
| 1153 | // Break the comment sequence if the previous line did not end |
| 1154 | // in a trailing comment. |
| 1155 | (C.NewlinesBefore == 1 && I > 0 && |
| 1156 | !Changes[I - 1].IsTrailingComment) || |
| 1157 | WasAlignedWithStartOfNextLine) { |
| 1158 | alignTrailingComments(Start: StartOfSequence, End: I, Column: MinColumn); |
| 1159 | MinColumn = ChangeMinColumn; |
| 1160 | MaxColumn = ChangeMaxColumn; |
| 1161 | StartOfSequence = I; |
| 1162 | } else { |
| 1163 | MinColumn = std::max(a: MinColumn, b: ChangeMinColumn); |
| 1164 | MaxColumn = std::min(a: MaxColumn, b: ChangeMaxColumn); |
| 1165 | } |
| 1166 | BreakBeforeNext = (I == 0) || (C.NewlinesBefore > 1) || |
| 1167 | // Never start a sequence with a comment at the beginning |
| 1168 | // of the line. |
| 1169 | (C.NewlinesBefore == 1 && StartOfSequence == I); |
| 1170 | Newlines = 0; |
| 1171 | } |
| 1172 | alignTrailingComments(Start: StartOfSequence, End: Size, Column: MinColumn); |
| 1173 | } |
| 1174 | |
| 1175 | void WhitespaceManager::(unsigned Start, unsigned End, |
| 1176 | unsigned Column) { |
| 1177 | for (unsigned i = Start; i != End; ++i) { |
| 1178 | int Shift = 0; |
| 1179 | if (Changes[i].IsTrailingComment) |
| 1180 | Shift = Column - Changes[i].StartOfTokenColumn; |
| 1181 | if (Changes[i].StartOfBlockComment) { |
| 1182 | Shift = Changes[i].IndentationOffset + |
| 1183 | Changes[i].StartOfBlockComment->StartOfTokenColumn - |
| 1184 | Changes[i].StartOfTokenColumn; |
| 1185 | } |
| 1186 | if (Shift <= 0) |
| 1187 | continue; |
| 1188 | Changes[i].Spaces += Shift; |
| 1189 | if (i + 1 != Changes.size()) |
| 1190 | Changes[i + 1].PreviousEndOfTokenColumn += Shift; |
| 1191 | Changes[i].StartOfTokenColumn += Shift; |
| 1192 | } |
| 1193 | } |
| 1194 | |
| 1195 | void WhitespaceManager::alignEscapedNewlines() { |
| 1196 | const auto Align = Style.AlignEscapedNewlines; |
| 1197 | if (Align == FormatStyle::ENAS_DontAlign) |
| 1198 | return; |
| 1199 | |
| 1200 | const bool WithLastLine = Align == FormatStyle::ENAS_LeftWithLastLine; |
| 1201 | const bool AlignLeft = Align == FormatStyle::ENAS_Left || WithLastLine; |
| 1202 | const auto MaxColumn = Style.ColumnLimit; |
| 1203 | unsigned MaxEndOfLine = AlignLeft ? 0 : MaxColumn; |
| 1204 | unsigned StartOfMacro = 0; |
| 1205 | for (unsigned i = 1, e = Changes.size(); i < e; ++i) { |
| 1206 | Change &C = Changes[i]; |
| 1207 | if (C.NewlinesBefore == 0 && (!WithLastLine || C.Tok->isNot(Kind: tok::eof))) |
| 1208 | continue; |
| 1209 | const bool InPPDirective = C.ContinuesPPDirective; |
| 1210 | const auto BackslashColumn = C.PreviousEndOfTokenColumn + 2; |
| 1211 | if (InPPDirective || |
| 1212 | (WithLastLine && (MaxColumn == 0 || BackslashColumn <= MaxColumn))) { |
| 1213 | MaxEndOfLine = std::max(a: BackslashColumn, b: MaxEndOfLine); |
| 1214 | } |
| 1215 | if (!InPPDirective) { |
| 1216 | alignEscapedNewlines(Start: StartOfMacro + 1, End: i, Column: MaxEndOfLine); |
| 1217 | MaxEndOfLine = AlignLeft ? 0 : MaxColumn; |
| 1218 | StartOfMacro = i; |
| 1219 | } |
| 1220 | } |
| 1221 | alignEscapedNewlines(Start: StartOfMacro + 1, End: Changes.size(), Column: MaxEndOfLine); |
| 1222 | } |
| 1223 | |
| 1224 | void WhitespaceManager::alignEscapedNewlines(unsigned Start, unsigned End, |
| 1225 | unsigned Column) { |
| 1226 | for (unsigned i = Start; i < End; ++i) { |
| 1227 | Change &C = Changes[i]; |
| 1228 | if (C.NewlinesBefore > 0) { |
| 1229 | assert(C.ContinuesPPDirective); |
| 1230 | if (C.PreviousEndOfTokenColumn + 1 > Column) |
| 1231 | C.EscapedNewlineColumn = 0; |
| 1232 | else |
| 1233 | C.EscapedNewlineColumn = Column; |
| 1234 | } |
| 1235 | } |
| 1236 | } |
| 1237 | |
| 1238 | void WhitespaceManager::alignArrayInitializers() { |
| 1239 | if (Style.AlignArrayOfStructures == FormatStyle::AIAS_None) |
| 1240 | return; |
| 1241 | |
| 1242 | for (unsigned ChangeIndex = 1U, ChangeEnd = Changes.size(); |
| 1243 | ChangeIndex < ChangeEnd; ++ChangeIndex) { |
| 1244 | auto &C = Changes[ChangeIndex]; |
| 1245 | if (C.Tok->IsArrayInitializer) { |
| 1246 | bool FoundComplete = false; |
| 1247 | for (unsigned InsideIndex = ChangeIndex + 1; InsideIndex < ChangeEnd; |
| 1248 | ++InsideIndex) { |
| 1249 | const auto *Tok = Changes[InsideIndex].Tok; |
| 1250 | if (Tok->is(Kind: tok::pp_define)) |
| 1251 | break; |
| 1252 | if (Tok == C.Tok->MatchingParen) { |
| 1253 | alignArrayInitializers(Start: ChangeIndex, End: InsideIndex + 1); |
| 1254 | ChangeIndex = InsideIndex + 1; |
| 1255 | FoundComplete = true; |
| 1256 | break; |
| 1257 | } |
| 1258 | } |
| 1259 | if (!FoundComplete) |
| 1260 | ChangeIndex = ChangeEnd; |
| 1261 | } |
| 1262 | } |
| 1263 | } |
| 1264 | |
| 1265 | void WhitespaceManager::alignArrayInitializers(unsigned Start, unsigned End) { |
| 1266 | |
| 1267 | if (Style.AlignArrayOfStructures == FormatStyle::AIAS_Right) |
| 1268 | alignArrayInitializersRightJustified(CellDescs: getCells(Start, End)); |
| 1269 | else if (Style.AlignArrayOfStructures == FormatStyle::AIAS_Left) |
| 1270 | alignArrayInitializersLeftJustified(CellDescs: getCells(Start, End)); |
| 1271 | } |
| 1272 | |
| 1273 | void WhitespaceManager::alignArrayInitializersRightJustified( |
| 1274 | CellDescriptions &&CellDescs) { |
| 1275 | if (!CellDescs.isRectangular()) |
| 1276 | return; |
| 1277 | |
| 1278 | const int BracePadding = |
| 1279 | Style.Cpp11BracedListStyle != FormatStyle::BLS_Block ? 0 : 1; |
| 1280 | auto &Cells = CellDescs.Cells; |
| 1281 | // Now go through and fixup the spaces. |
| 1282 | auto *CellIter = Cells.begin(); |
| 1283 | for (auto i = 0U; i < CellDescs.CellCounts[0]; ++i, ++CellIter) { |
| 1284 | unsigned NetWidth = 0U; |
| 1285 | if (isSplitCell(Cell: *CellIter)) |
| 1286 | NetWidth = getNetWidth(Start: Cells.begin(), End: CellIter, InitialSpaces: CellDescs.InitialSpaces); |
| 1287 | auto CellWidth = getMaximumCellWidth(CellIter, NetWidth); |
| 1288 | |
| 1289 | if (Changes[CellIter->Index].Tok->is(Kind: tok::r_brace)) { |
| 1290 | // So in here we want to see if there is a brace that falls |
| 1291 | // on a line that was split. If so on that line we make sure that |
| 1292 | // the spaces in front of the brace are enough. |
| 1293 | const auto *Next = CellIter; |
| 1294 | do { |
| 1295 | const FormatToken *Previous = Changes[Next->Index].Tok->Previous; |
| 1296 | if (Previous && Previous->isNot(Kind: TT_LineComment)) { |
| 1297 | Changes[Next->Index].Spaces = BracePadding; |
| 1298 | Changes[Next->Index].NewlinesBefore = 0; |
| 1299 | } |
| 1300 | Next = Next->NextColumnElement; |
| 1301 | } while (Next); |
| 1302 | // Unless the array is empty, we need the position of all the |
| 1303 | // immediately adjacent cells |
| 1304 | if (CellIter != Cells.begin()) { |
| 1305 | auto ThisNetWidth = |
| 1306 | getNetWidth(Start: Cells.begin(), End: CellIter, InitialSpaces: CellDescs.InitialSpaces); |
| 1307 | auto MaxNetWidth = getMaximumNetWidth( |
| 1308 | CellStart: Cells.begin(), CellStop: CellIter, InitialSpaces: CellDescs.InitialSpaces, |
| 1309 | CellCount: CellDescs.CellCounts[0], MaxRowCount: CellDescs.CellCounts.size()); |
| 1310 | if (ThisNetWidth < MaxNetWidth) |
| 1311 | Changes[CellIter->Index].Spaces = (MaxNetWidth - ThisNetWidth); |
| 1312 | auto RowCount = 1U; |
| 1313 | auto Offset = std::distance(first: Cells.begin(), last: CellIter); |
| 1314 | for (const auto *Next = CellIter->NextColumnElement; Next; |
| 1315 | Next = Next->NextColumnElement) { |
| 1316 | if (RowCount >= CellDescs.CellCounts.size()) |
| 1317 | break; |
| 1318 | auto *Start = (Cells.begin() + RowCount * CellDescs.CellCounts[0]); |
| 1319 | auto *End = Start + Offset; |
| 1320 | ThisNetWidth = getNetWidth(Start, End, InitialSpaces: CellDescs.InitialSpaces); |
| 1321 | if (ThisNetWidth < MaxNetWidth) |
| 1322 | Changes[Next->Index].Spaces = (MaxNetWidth - ThisNetWidth); |
| 1323 | ++RowCount; |
| 1324 | } |
| 1325 | } |
| 1326 | } else { |
| 1327 | auto ThisWidth = |
| 1328 | calculateCellWidth(Start: CellIter->Index, End: CellIter->EndIndex, WithSpaces: true) + |
| 1329 | NetWidth; |
| 1330 | if (Changes[CellIter->Index].NewlinesBefore == 0) { |
| 1331 | Changes[CellIter->Index].Spaces = (CellWidth - (ThisWidth + NetWidth)); |
| 1332 | Changes[CellIter->Index].Spaces += (i > 0) ? 1 : BracePadding; |
| 1333 | } |
| 1334 | alignToStartOfCell(Start: CellIter->Index, End: CellIter->EndIndex); |
| 1335 | for (const auto *Next = CellIter->NextColumnElement; Next; |
| 1336 | Next = Next->NextColumnElement) { |
| 1337 | ThisWidth = |
| 1338 | calculateCellWidth(Start: Next->Index, End: Next->EndIndex, WithSpaces: true) + NetWidth; |
| 1339 | if (Changes[Next->Index].NewlinesBefore == 0) { |
| 1340 | Changes[Next->Index].Spaces = (CellWidth - ThisWidth); |
| 1341 | Changes[Next->Index].Spaces += (i > 0) ? 1 : BracePadding; |
| 1342 | } |
| 1343 | alignToStartOfCell(Start: Next->Index, End: Next->EndIndex); |
| 1344 | } |
| 1345 | } |
| 1346 | } |
| 1347 | } |
| 1348 | |
| 1349 | void WhitespaceManager::alignArrayInitializersLeftJustified( |
| 1350 | CellDescriptions &&CellDescs) { |
| 1351 | |
| 1352 | if (!CellDescs.isRectangular()) |
| 1353 | return; |
| 1354 | |
| 1355 | const int BracePadding = |
| 1356 | Style.Cpp11BracedListStyle != FormatStyle::BLS_Block ? 0 : 1; |
| 1357 | auto &Cells = CellDescs.Cells; |
| 1358 | // Now go through and fixup the spaces. |
| 1359 | auto *CellIter = Cells.begin(); |
| 1360 | // The first cell of every row needs to be against the left brace. |
| 1361 | for (const auto *Next = CellIter; Next; Next = Next->NextColumnElement) { |
| 1362 | auto &Change = Changes[Next->Index]; |
| 1363 | Change.Spaces = |
| 1364 | Change.NewlinesBefore == 0 ? BracePadding : CellDescs.InitialSpaces; |
| 1365 | } |
| 1366 | ++CellIter; |
| 1367 | for (auto i = 1U; i < CellDescs.CellCounts[0]; i++, ++CellIter) { |
| 1368 | auto MaxNetWidth = getMaximumNetWidth( |
| 1369 | CellStart: Cells.begin(), CellStop: CellIter, InitialSpaces: CellDescs.InitialSpaces, |
| 1370 | CellCount: CellDescs.CellCounts[0], MaxRowCount: CellDescs.CellCounts.size()); |
| 1371 | auto ThisNetWidth = |
| 1372 | getNetWidth(Start: Cells.begin(), End: CellIter, InitialSpaces: CellDescs.InitialSpaces); |
| 1373 | if (Changes[CellIter->Index].NewlinesBefore == 0) { |
| 1374 | Changes[CellIter->Index].Spaces = |
| 1375 | MaxNetWidth - ThisNetWidth + |
| 1376 | (Changes[CellIter->Index].Tok->isNot(Kind: tok::r_brace) ? 1 |
| 1377 | : BracePadding); |
| 1378 | } |
| 1379 | auto RowCount = 1U; |
| 1380 | auto Offset = std::distance(first: Cells.begin(), last: CellIter); |
| 1381 | for (const auto *Next = CellIter->NextColumnElement; Next; |
| 1382 | Next = Next->NextColumnElement) { |
| 1383 | if (RowCount >= CellDescs.CellCounts.size()) |
| 1384 | break; |
| 1385 | auto *Start = (Cells.begin() + RowCount * CellDescs.CellCounts[0]); |
| 1386 | auto *End = Start + Offset; |
| 1387 | auto ThisNetWidth = getNetWidth(Start, End, InitialSpaces: CellDescs.InitialSpaces); |
| 1388 | if (Changes[Next->Index].NewlinesBefore == 0) { |
| 1389 | Changes[Next->Index].Spaces = |
| 1390 | MaxNetWidth - ThisNetWidth + |
| 1391 | (Changes[Next->Index].Tok->isNot(Kind: tok::r_brace) ? 1 : BracePadding); |
| 1392 | } |
| 1393 | ++RowCount; |
| 1394 | } |
| 1395 | } |
| 1396 | } |
| 1397 | |
| 1398 | bool WhitespaceManager::isSplitCell(const CellDescription &Cell) { |
| 1399 | if (Cell.HasSplit) |
| 1400 | return true; |
| 1401 | for (const auto *Next = Cell.NextColumnElement; Next; |
| 1402 | Next = Next->NextColumnElement) { |
| 1403 | if (Next->HasSplit) |
| 1404 | return true; |
| 1405 | } |
| 1406 | return false; |
| 1407 | } |
| 1408 | |
| 1409 | WhitespaceManager::CellDescriptions WhitespaceManager::getCells(unsigned Start, |
| 1410 | unsigned End) { |
| 1411 | |
| 1412 | unsigned Depth = 0; |
| 1413 | unsigned Cell = 0; |
| 1414 | SmallVector<unsigned> CellCounts; |
| 1415 | unsigned InitialSpaces = 0; |
| 1416 | unsigned InitialTokenLength = 0; |
| 1417 | unsigned EndSpaces = 0; |
| 1418 | SmallVector<CellDescription> Cells; |
| 1419 | const FormatToken *MatchingParen = nullptr; |
| 1420 | for (unsigned i = Start; i < End; ++i) { |
| 1421 | auto &C = Changes[i]; |
| 1422 | if (C.Tok->is(Kind: tok::l_brace)) |
| 1423 | ++Depth; |
| 1424 | else if (C.Tok->is(Kind: tok::r_brace)) |
| 1425 | --Depth; |
| 1426 | if (Depth == 2) { |
| 1427 | if (C.Tok->is(Kind: tok::l_brace)) { |
| 1428 | Cell = 0; |
| 1429 | MatchingParen = C.Tok->MatchingParen; |
| 1430 | if (InitialSpaces == 0) { |
| 1431 | InitialSpaces = C.Spaces + C.TokenLength; |
| 1432 | InitialTokenLength = C.TokenLength; |
| 1433 | auto j = i - 1; |
| 1434 | for (; Changes[j].NewlinesBefore == 0 && j > Start; --j) { |
| 1435 | InitialSpaces += Changes[j].Spaces + Changes[j].TokenLength; |
| 1436 | InitialTokenLength += Changes[j].TokenLength; |
| 1437 | } |
| 1438 | if (C.NewlinesBefore == 0) { |
| 1439 | InitialSpaces += Changes[j].Spaces + Changes[j].TokenLength; |
| 1440 | InitialTokenLength += Changes[j].TokenLength; |
| 1441 | } |
| 1442 | } |
| 1443 | } else if (C.Tok->is(Kind: tok::comma)) { |
| 1444 | if (!Cells.empty()) |
| 1445 | Cells.back().EndIndex = i; |
| 1446 | if (const auto *Next = C.Tok->getNextNonComment(); |
| 1447 | Next && Next->isNot(Kind: tok::r_brace)) { // dangling comma |
| 1448 | ++Cell; |
| 1449 | } |
| 1450 | } |
| 1451 | } else if (Depth == 1) { |
| 1452 | if (C.Tok == MatchingParen) { |
| 1453 | if (!Cells.empty()) |
| 1454 | Cells.back().EndIndex = i; |
| 1455 | Cells.push_back(Elt: CellDescription{.Index: i, .Cell: ++Cell, .EndIndex: i + 1, .HasSplit: false, .NextColumnElement: nullptr}); |
| 1456 | CellCounts.push_back(Elt: C.Tok->Previous->isNot(Kind: tok::comma) ? Cell + 1 |
| 1457 | : Cell); |
| 1458 | // Go to the next non-comment and ensure there is a break in front |
| 1459 | const auto * = C.Tok->getNextNonComment(); |
| 1460 | while (NextNonComment && NextNonComment->is(Kind: tok::comma)) |
| 1461 | NextNonComment = NextNonComment->getNextNonComment(); |
| 1462 | auto j = i; |
| 1463 | while (j < End && Changes[j].Tok != NextNonComment) |
| 1464 | ++j; |
| 1465 | if (j < End && Changes[j].NewlinesBefore == 0 && |
| 1466 | Changes[j].Tok->isNot(Kind: tok::r_brace)) { |
| 1467 | Changes[j].NewlinesBefore = 1; |
| 1468 | // Account for the added token lengths |
| 1469 | Changes[j].Spaces = InitialSpaces - InitialTokenLength; |
| 1470 | } |
| 1471 | } else if (C.Tok->is(Kind: tok::comment) && C.Tok->NewlinesBefore == 0) { |
| 1472 | // Trailing comments stay at a space past the last token |
| 1473 | C.Spaces = Changes[i - 1].Tok->is(Kind: tok::comma) ? 1 : 2; |
| 1474 | } else if (C.Tok->is(Kind: tok::l_brace)) { |
| 1475 | // We need to make sure that the ending braces is aligned to the |
| 1476 | // start of our initializer |
| 1477 | auto j = i - 1; |
| 1478 | for (; j > 0 && !Changes[j].Tok->ArrayInitializerLineStart; --j) |
| 1479 | ; // Nothing the loop does the work |
| 1480 | EndSpaces = Changes[j].Spaces; |
| 1481 | } |
| 1482 | } else if (Depth == 0 && C.Tok->is(Kind: tok::r_brace)) { |
| 1483 | C.NewlinesBefore = 1; |
| 1484 | C.Spaces = EndSpaces; |
| 1485 | } |
| 1486 | if (C.Tok->StartsColumn) { |
| 1487 | // This gets us past tokens that have been split over multiple |
| 1488 | // lines |
| 1489 | bool HasSplit = false; |
| 1490 | if (Changes[i].NewlinesBefore > 0) { |
| 1491 | // So if we split a line previously and the tail line + this token is |
| 1492 | // less then the column limit we remove the split here and just put |
| 1493 | // the column start at a space past the comma |
| 1494 | // |
| 1495 | // FIXME This if branch covers the cases where the column is not |
| 1496 | // the first column. This leads to weird pathologies like the formatting |
| 1497 | // auto foo = Items{ |
| 1498 | // Section{ |
| 1499 | // 0, bar(), |
| 1500 | // } |
| 1501 | // }; |
| 1502 | // Well if it doesn't lead to that it's indicative that the line |
| 1503 | // breaking should be revisited. Unfortunately alot of other options |
| 1504 | // interact with this |
| 1505 | auto j = i - 1; |
| 1506 | if ((j - 1) > Start && Changes[j].Tok->is(Kind: tok::comma) && |
| 1507 | Changes[j - 1].NewlinesBefore > 0) { |
| 1508 | --j; |
| 1509 | auto LineLimit = Changes[j].Spaces + Changes[j].TokenLength; |
| 1510 | if (LineLimit < Style.ColumnLimit) { |
| 1511 | Changes[i].NewlinesBefore = 0; |
| 1512 | Changes[i].Spaces = 1; |
| 1513 | } |
| 1514 | } |
| 1515 | } |
| 1516 | while (Changes[i].NewlinesBefore > 0 && Changes[i].Tok == C.Tok) { |
| 1517 | Changes[i].Spaces = InitialSpaces; |
| 1518 | ++i; |
| 1519 | HasSplit = true; |
| 1520 | } |
| 1521 | if (Changes[i].Tok != C.Tok) |
| 1522 | --i; |
| 1523 | Cells.push_back(Elt: CellDescription{.Index: i, .Cell: Cell, .EndIndex: i, .HasSplit: HasSplit, .NextColumnElement: nullptr}); |
| 1524 | } |
| 1525 | } |
| 1526 | |
| 1527 | return linkCells(CellDesc: {.Cells: Cells, .CellCounts: CellCounts, .InitialSpaces: InitialSpaces}); |
| 1528 | } |
| 1529 | |
| 1530 | unsigned WhitespaceManager::calculateCellWidth(unsigned Start, unsigned End, |
| 1531 | bool WithSpaces) const { |
| 1532 | unsigned CellWidth = 0; |
| 1533 | for (auto i = Start; i < End; i++) { |
| 1534 | if (Changes[i].NewlinesBefore > 0) |
| 1535 | CellWidth = 0; |
| 1536 | CellWidth += Changes[i].TokenLength; |
| 1537 | CellWidth += (WithSpaces ? Changes[i].Spaces : 0); |
| 1538 | } |
| 1539 | return CellWidth; |
| 1540 | } |
| 1541 | |
| 1542 | void WhitespaceManager::alignToStartOfCell(unsigned Start, unsigned End) { |
| 1543 | if ((End - Start) <= 1) |
| 1544 | return; |
| 1545 | // If the line is broken anywhere in there make sure everything |
| 1546 | // is aligned to the parent |
| 1547 | for (auto i = Start + 1; i < End; i++) |
| 1548 | if (Changes[i].NewlinesBefore > 0) |
| 1549 | Changes[i].Spaces = Changes[Start].Spaces; |
| 1550 | } |
| 1551 | |
| 1552 | WhitespaceManager::CellDescriptions |
| 1553 | WhitespaceManager::linkCells(CellDescriptions &&CellDesc) { |
| 1554 | auto &Cells = CellDesc.Cells; |
| 1555 | for (auto *CellIter = Cells.begin(); CellIter != Cells.end(); ++CellIter) { |
| 1556 | if (!CellIter->NextColumnElement && (CellIter + 1) != Cells.end()) { |
| 1557 | for (auto *NextIter = CellIter + 1; NextIter != Cells.end(); ++NextIter) { |
| 1558 | if (NextIter->Cell == CellIter->Cell) { |
| 1559 | CellIter->NextColumnElement = &(*NextIter); |
| 1560 | break; |
| 1561 | } |
| 1562 | } |
| 1563 | } |
| 1564 | } |
| 1565 | return std::move(CellDesc); |
| 1566 | } |
| 1567 | |
| 1568 | void WhitespaceManager::generateChanges() { |
| 1569 | for (unsigned i = 0, e = Changes.size(); i != e; ++i) { |
| 1570 | const Change &C = Changes[i]; |
| 1571 | if (i > 0) { |
| 1572 | auto Last = Changes[i - 1].OriginalWhitespaceRange; |
| 1573 | auto New = Changes[i].OriginalWhitespaceRange; |
| 1574 | // Do not generate two replacements for the same location. As a special |
| 1575 | // case, it is allowed if there is a replacement for the empty range |
| 1576 | // between 2 tokens and another non-empty range at the start of the second |
| 1577 | // token. We didn't implement logic to combine replacements for 2 |
| 1578 | // consecutive source ranges into a single replacement, because the |
| 1579 | // program works fine without it. |
| 1580 | // |
| 1581 | // We can't eliminate empty original whitespace ranges. They appear when |
| 1582 | // 2 tokens have no whitespace in between in the input. It does not |
| 1583 | // matter whether whitespace is to be added. If no whitespace is to be |
| 1584 | // added, the replacement will be empty, and it gets eliminated after this |
| 1585 | // step in storeReplacement. For example, if the input is `foo();`, |
| 1586 | // there will be a replacement for the range between every consecutive |
| 1587 | // pair of tokens. |
| 1588 | // |
| 1589 | // A replacement at the start of a token can be added by |
| 1590 | // BreakableStringLiteralUsingOperators::insertBreak when it adds braces |
| 1591 | // around the string literal. Say Verilog code is being formatted and the |
| 1592 | // first line is to become the next 2 lines. |
| 1593 | // x("long string"); |
| 1594 | // x({"long ", |
| 1595 | // "string"}); |
| 1596 | // There will be a replacement for the empty range between the parenthesis |
| 1597 | // and the string and another replacement for the quote character. The |
| 1598 | // replacement for the empty range between the parenthesis and the quote |
| 1599 | // comes from ContinuationIndenter::addTokenOnCurrentLine when it changes |
| 1600 | // the original empty range between the parenthesis and the string to |
| 1601 | // another empty one. The replacement for the quote character comes from |
| 1602 | // BreakableStringLiteralUsingOperators::insertBreak when it adds the |
| 1603 | // brace. In the example, the replacement for the empty range is the same |
| 1604 | // as the original text. However, eliminating replacements that are same |
| 1605 | // as the original does not help in general. For example, a newline can |
| 1606 | // be inserted, causing the first line to become the next 3 lines. |
| 1607 | // xxxxxxxxxxx("long string"); |
| 1608 | // xxxxxxxxxxx( |
| 1609 | // {"long ", |
| 1610 | // "string"}); |
| 1611 | // In that case, the empty range between the parenthesis and the string |
| 1612 | // will be replaced by a newline and 4 spaces. So we will still have to |
| 1613 | // deal with a replacement for an empty source range followed by a |
| 1614 | // replacement for a non-empty source range. |
| 1615 | if (Last.getBegin() == New.getBegin() && |
| 1616 | (Last.getEnd() != Last.getBegin() || |
| 1617 | New.getEnd() == New.getBegin())) { |
| 1618 | continue; |
| 1619 | } |
| 1620 | } |
| 1621 | if (C.CreateReplacement) { |
| 1622 | std::string ReplacementText = C.PreviousLinePostfix; |
| 1623 | if (C.ContinuesPPDirective) { |
| 1624 | appendEscapedNewlineText(Text&: ReplacementText, Newlines: C.NewlinesBefore, |
| 1625 | PreviousEndOfTokenColumn: C.PreviousEndOfTokenColumn, |
| 1626 | EscapedNewlineColumn: C.EscapedNewlineColumn); |
| 1627 | } else { |
| 1628 | appendNewlineText(Text&: ReplacementText, C); |
| 1629 | } |
| 1630 | // FIXME: This assert should hold if we computed the column correctly. |
| 1631 | // assert((int)C.StartOfTokenColumn >= C.Spaces); |
| 1632 | appendIndentText( |
| 1633 | Text&: ReplacementText, IndentLevel: C.Tok->IndentLevel, Spaces: std::max(a: 0, b: C.Spaces), |
| 1634 | WhitespaceStartColumn: std::max(a: (int)C.StartOfTokenColumn, b: C.Spaces) - std::max(a: 0, b: C.Spaces), |
| 1635 | IsAligned: C.IsAligned); |
| 1636 | ReplacementText.append(str: C.CurrentLinePrefix); |
| 1637 | storeReplacement(Range: C.OriginalWhitespaceRange, Text: ReplacementText); |
| 1638 | } |
| 1639 | } |
| 1640 | } |
| 1641 | |
| 1642 | void WhitespaceManager::storeReplacement(SourceRange Range, StringRef Text) { |
| 1643 | unsigned WhitespaceLength = SourceMgr.getFileOffset(SpellingLoc: Range.getEnd()) - |
| 1644 | SourceMgr.getFileOffset(SpellingLoc: Range.getBegin()); |
| 1645 | // Don't create a replacement, if it does not change anything. |
| 1646 | if (StringRef(SourceMgr.getCharacterData(SL: Range.getBegin()), |
| 1647 | WhitespaceLength) == Text) { |
| 1648 | return; |
| 1649 | } |
| 1650 | auto Err = Replaces.add(R: tooling::Replacement( |
| 1651 | SourceMgr, CharSourceRange::getCharRange(R: Range), Text)); |
| 1652 | // FIXME: better error handling. For now, just print an error message in the |
| 1653 | // release version. |
| 1654 | if (Err) { |
| 1655 | llvm::errs() << llvm::toString(E: std::move(Err)) << "\n" ; |
| 1656 | assert(false); |
| 1657 | } |
| 1658 | } |
| 1659 | |
| 1660 | void WhitespaceManager::appendNewlineText(std::string &Text, const Change &C) { |
| 1661 | if (C.NewlinesBefore <= 0) |
| 1662 | return; |
| 1663 | |
| 1664 | StringRef Newline = UseCRLF ? "\r\n" : "\n" ; |
| 1665 | Text.append(svt: Newline); |
| 1666 | |
| 1667 | if (C.Tok->HasFormFeedBefore) |
| 1668 | Text.append(s: "\f" ); |
| 1669 | |
| 1670 | for (unsigned I = 1; I < C.NewlinesBefore; ++I) |
| 1671 | Text.append(svt: Newline); |
| 1672 | } |
| 1673 | |
| 1674 | void WhitespaceManager::appendEscapedNewlineText( |
| 1675 | std::string &Text, unsigned Newlines, unsigned PreviousEndOfTokenColumn, |
| 1676 | unsigned EscapedNewlineColumn) { |
| 1677 | if (Newlines > 0) { |
| 1678 | unsigned Spaces = |
| 1679 | std::max<int>(a: 1, b: EscapedNewlineColumn - PreviousEndOfTokenColumn - 1); |
| 1680 | for (unsigned i = 0; i < Newlines; ++i) { |
| 1681 | Text.append(n: Spaces, c: ' '); |
| 1682 | Text.append(s: UseCRLF ? "\\\r\n" : "\\\n" ); |
| 1683 | Spaces = std::max<int>(a: 0, b: EscapedNewlineColumn - 1); |
| 1684 | } |
| 1685 | } |
| 1686 | } |
| 1687 | |
| 1688 | void WhitespaceManager::appendIndentText(std::string &Text, |
| 1689 | unsigned IndentLevel, unsigned Spaces, |
| 1690 | unsigned WhitespaceStartColumn, |
| 1691 | bool IsAligned) { |
| 1692 | switch (Style.UseTab) { |
| 1693 | case FormatStyle::UT_Never: |
| 1694 | Text.append(n: Spaces, c: ' '); |
| 1695 | break; |
| 1696 | case FormatStyle::UT_Always: { |
| 1697 | if (Style.TabWidth) { |
| 1698 | unsigned FirstTabWidth = |
| 1699 | Style.TabWidth - WhitespaceStartColumn % Style.TabWidth; |
| 1700 | |
| 1701 | // Insert only spaces when we want to end up before the next tab. |
| 1702 | if (Spaces < FirstTabWidth || Spaces == 1) { |
| 1703 | Text.append(n: Spaces, c: ' '); |
| 1704 | break; |
| 1705 | } |
| 1706 | // Align to the next tab. |
| 1707 | Spaces -= FirstTabWidth; |
| 1708 | Text.append(s: "\t" ); |
| 1709 | |
| 1710 | Text.append(n: Spaces / Style.TabWidth, c: '\t'); |
| 1711 | Text.append(n: Spaces % Style.TabWidth, c: ' '); |
| 1712 | } else if (Spaces == 1) { |
| 1713 | Text.append(n: Spaces, c: ' '); |
| 1714 | } |
| 1715 | break; |
| 1716 | } |
| 1717 | case FormatStyle::UT_ForIndentation: |
| 1718 | if (WhitespaceStartColumn == 0) { |
| 1719 | unsigned Indentation = IndentLevel * Style.IndentWidth; |
| 1720 | Spaces = appendTabIndent(Text, Spaces, Indentation); |
| 1721 | } |
| 1722 | Text.append(n: Spaces, c: ' '); |
| 1723 | break; |
| 1724 | case FormatStyle::UT_ForContinuationAndIndentation: |
| 1725 | if (WhitespaceStartColumn == 0) |
| 1726 | Spaces = appendTabIndent(Text, Spaces, Indentation: Spaces); |
| 1727 | Text.append(n: Spaces, c: ' '); |
| 1728 | break; |
| 1729 | case FormatStyle::UT_AlignWithSpaces: |
| 1730 | if (WhitespaceStartColumn == 0) { |
| 1731 | unsigned Indentation = |
| 1732 | IsAligned ? IndentLevel * Style.IndentWidth : Spaces; |
| 1733 | Spaces = appendTabIndent(Text, Spaces, Indentation); |
| 1734 | } |
| 1735 | Text.append(n: Spaces, c: ' '); |
| 1736 | break; |
| 1737 | } |
| 1738 | } |
| 1739 | |
| 1740 | unsigned WhitespaceManager::appendTabIndent(std::string &Text, unsigned Spaces, |
| 1741 | unsigned Indentation) { |
| 1742 | // This happens, e.g. when a line in a block comment is indented less than the |
| 1743 | // first one. |
| 1744 | if (Indentation > Spaces) |
| 1745 | Indentation = Spaces; |
| 1746 | if (Style.TabWidth) { |
| 1747 | unsigned Tabs = Indentation / Style.TabWidth; |
| 1748 | Text.append(n: Tabs, c: '\t'); |
| 1749 | Spaces -= Tabs * Style.TabWidth; |
| 1750 | } |
| 1751 | return Spaces; |
| 1752 | } |
| 1753 | |
| 1754 | } // namespace format |
| 1755 | } // namespace clang |
| 1756 | |