WhitespaceManager.cpp source code [llvm_projects/clang/lib/Format/WhitespaceManager.cpp]

1	//===--- WhitespaceManager.cpp - Format C++ code --------------------------===//
2	//
3	// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4	// See https://llvm.org/LICENSE.txt for license information.
5	// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6	//
7	//===----------------------------------------------------------------------===//
8	///
9	/// \file
10	/// This file implements WhitespaceManager class.
11	///
12	//===----------------------------------------------------------------------===//
13
14	#include "WhitespaceManager.h"
15	#include "llvm/ADT/STLExtras.h"
16	#include "llvm/ADT/SmallVector.h"
17	#include <algorithm>
18
19	namespace clang {
20	namespace format {
21
22	bool WhitespaceManager::Change::IsBeforeInFile::operator()(
23	const Change &C1, const Change &C2) const {
24	return SourceMgr.isBeforeInTranslationUnit(
25	LHS: C1.OriginalWhitespaceRange.getBegin(),
26	RHS: C2.OriginalWhitespaceRange.getBegin()) \|\|
27	(C1.OriginalWhitespaceRange.getBegin() ==
28	C2.OriginalWhitespaceRange.getBegin() &&
29	SourceMgr.isBeforeInTranslationUnit(
30	LHS: C1.OriginalWhitespaceRange.getEnd(),
31	RHS: C2.OriginalWhitespaceRange.getEnd()));
32	}
33
34	WhitespaceManager::Change::Change(const FormatToken &Tok,
35	bool CreateReplacement,
36	SourceRange OriginalWhitespaceRange,
37	int Spaces, unsigned StartOfTokenColumn,
38	unsigned NewlinesBefore,
39	StringRef PreviousLinePostfix,
40	StringRef CurrentLinePrefix, bool IsAligned,
41	bool ContinuesPPDirective, bool IsInsideToken)
42	: Tok(&Tok), CreateReplacement(CreateReplacement),
43	OriginalWhitespaceRange (OriginalWhitespaceRange),
44	StartOfTokenColumn(StartOfTokenColumn), NewlinesBefore(NewlinesBefore),
45	PreviousLinePostfix (PreviousLinePostfix),
46	CurrentLinePrefix (CurrentLinePrefix), IsAligned(IsAligned),
47	ContinuesPPDirective(ContinuesPPDirective), Spaces(Spaces),
48	IsInsideToken(IsInsideToken), IsTrailingComment(false), TokenLength(`0`),
49	PreviousEndOfTokenColumn(`0`), EscapedNewlineColumn(`0`),
50	StartOfBlockComment(nullptr), IndentationOffset(`0`), ConditionalsLevel(`0`) {
51	}
52
53	void WhitespaceManager::replaceWhitespace(FormatToken &Tok, unsigned Newlines,
54	unsigned Spaces,
55	unsigned StartOfTokenColumn,
56	bool IsAligned, bool InPPDirective) {
57	if (Tok.Finalized \|\| (Tok.MacroCtx && Tok.MacroCtx ->Role == MR_ExpandedArg))
58	return;
59	Tok.setDecision((Newlines > `0`) ? FD_Break : FD_Continue);
60	Changes.push_back(Elt: Change (Tok, /CreateReplacement=/true, Tok.WhitespaceRange,
61	Spaces, StartOfTokenColumn, Newlines, "", "",
62	IsAligned, InPPDirective && !Tok.IsFirst,
63	/IsInsideToken=/false));
64	}
65
66	void WhitespaceManager::addUntouchableToken(const FormatToken &Tok,
67	bool InPPDirective) {
68	if (Tok.Finalized \|\| (Tok.MacroCtx && Tok.MacroCtx ->Role == MR_ExpandedArg))
69	return;
70	Changes.push_back(Elt: Change (Tok, /CreateReplacement=/false,
71	Tok.WhitespaceRange, /Spaces=/`0`,
72	Tok.OriginalColumn, Tok.NewlinesBefore, "", "",
73	/IsAligned=/false, InPPDirective && !Tok.IsFirst,
74	/IsInsideToken=/false));
75	}
76
77	llvm::Error
78	WhitespaceManager::addReplacement(const tooling::Replacement &Replacement) {
79	return Replaces.add(R: Replacement);
80	}
81
82	bool WhitespaceManager::inputUsesCRLF(StringRef Text, bool DefaultToCRLF) {
83	size_t LF = Text.count(C: `'\n'`);
84	size_t CR = Text.count(C: `'\r'`) * `2`;
85	return LF == CR ? DefaultToCRLF : CR > LF;
86	}
87
88	void WhitespaceManager::replaceWhitespaceInToken(
89	const FormatToken &Tok, unsigned Offset, unsigned ReplaceChars,
90	StringRef PreviousPostfix, StringRef CurrentPrefix, bool InPPDirective,
91	unsigned Newlines, int Spaces) {
92	if (Tok.Finalized \|\| (Tok.MacroCtx && Tok.MacroCtx ->Role == MR_ExpandedArg))
93	return;
94	SourceLocation Start = Tok.getStartOfNonWhitespace().getLocWithOffset(Offset);
95	Changes.push_back(
96	Elt: Change (Tok, /CreateReplacement=/true,
97	SourceRange (Start, Start.getLocWithOffset(Offset: ReplaceChars)), Spaces,
98	std::max(a: `0`, b: Spaces), Newlines, PreviousPostfix, CurrentPrefix,
99	/IsAligned=/true, InPPDirective && !Tok.IsFirst,
100	/IsInsideToken=/true));
101	}
102
103	const tooling::Replacements &WhitespaceManager::generateReplacements() {
104	if (Changes.empty())
105	return Replaces;
106
107	llvm::sort(C&: Changes, Comp: Change::IsBeforeInFile (SourceMgr));
108	calculateLineBreakInformation();
109	alignConsecutiveMacros();
110	alignConsecutiveShortCaseStatements(/IsExpr=/true);
111	alignConsecutiveShortCaseStatements(/IsExpr=/false);
112	alignConsecutiveDeclarations();
113	alignConsecutiveBitFields();
114	alignConsecutiveAssignments();
115	if (Style.isTableGen()) {
116	alignConsecutiveTableGenBreakingDAGArgColons();
117	alignConsecutiveTableGenCondOperatorColons();
118	alignConsecutiveTableGenDefinitions();
119	}
120	alignChainedConditionals();
121	alignTrailingComments();
122	alignEscapedNewlines();
123	alignArrayInitializers();
124	generateChanges();
125
126	return Replaces;
127	}
128
129	void WhitespaceManager::calculateLineBreakInformation() {
130	Changes [`0`].PreviousEndOfTokenColumn = `0`;
131	Change *LastOutsideTokenChange = &Changes [`0`];
132	for (unsigned I = `1`, e = Changes.size(); I != e; ++I) {
133	auto &C = Changes [I];
134	auto &P = Changes [I - `1`];
135	auto &PrevTokLength = P.TokenLength;
136	SourceLocation OriginalWhitespaceStart =
137	C.OriginalWhitespaceRange.getBegin();
138	SourceLocation PreviousOriginalWhitespaceEnd =
139	P.OriginalWhitespaceRange.getEnd();
140	unsigned OriginalWhitespaceStartOffset =
141	SourceMgr.getFileOffset(SpellingLoc: OriginalWhitespaceStart);
142	unsigned PreviousOriginalWhitespaceEndOffset =
143	SourceMgr.getFileOffset(SpellingLoc: PreviousOriginalWhitespaceEnd);
144	assert(PreviousOriginalWhitespaceEndOffset <=
145	OriginalWhitespaceStartOffset);
146	const char *const PreviousOriginalWhitespaceEndData =
147	SourceMgr.getCharacterData(SL: PreviousOriginalWhitespaceEnd);
148	StringRef Text(PreviousOriginalWhitespaceEndData,
149	SourceMgr.getCharacterData(SL: OriginalWhitespaceStart) -
150	PreviousOriginalWhitespaceEndData);
151	// Usually consecutive changes would occur in consecutive tokens. This is
152	// not the case however when analyzing some preprocessor runs of the
153	// annotated lines. For example, in this code:
154	//
155	// #if A // line 1
156	// int i = 1;
157	// #else B // line 2
158	// int i = 2;
159	// #endif // line 3
160	//
161	// one of the runs will produce the sequence of lines marked with line 1, 2
162	// and 3. So the two consecutive whitespace changes just before '// line 2'
163	// and before '#endif // line 3' span multiple lines and tokens:
164	//
165	// #else B{change X}[// line 2
166	// int i = 2;
167	// ]{change Y}#endif // line 3
168	//
169	// For this reason, if the text between consecutive changes spans multiple
170	// newlines, the token length must be adjusted to the end of the original
171	// line of the token.
172	auto NewlinePos = Text.find_first_of(C: `'\n'`);
173	if (NewlinePos == StringRef::npos) {
174	PrevTokLength = OriginalWhitespaceStartOffset -
175	PreviousOriginalWhitespaceEndOffset +
176	C.PreviousLinePostfix.size() + P.CurrentLinePrefix.size();
177	if (!P.IsInsideToken)
178	PrevTokLength = std::min(a: PrevTokLength, b: P.Tok->ColumnWidth);
179	} else {
180	PrevTokLength = NewlinePos + P.CurrentLinePrefix.size();
181	}
182
183	// If there are multiple changes in this token, sum up all the changes until
184	// the end of the line.
185	if (P.IsInsideToken && P.NewlinesBefore == `0`)
186	LastOutsideTokenChange->TokenLength += PrevTokLength + P.Spaces;
187	else
188	LastOutsideTokenChange = &P;
189
190	C.PreviousEndOfTokenColumn = P.StartOfTokenColumn + PrevTokLength;
191
192	P.IsTrailingComment =
193	(C.NewlinesBefore > `0` \|\| C.Tok->is(Kind: tok::eof) \|\|
194	(C.IsInsideToken && C.Tok->is(Kind: tok::comment))) &&
195	P.Tok->is(Kind: tok::comment) &&
196	// FIXME: This is a dirty hack. The problem is that
197	// BreakableLineCommentSection does comment reflow changes and here is
198	// the aligning of trailing comments. Consider the case where we reflow
199	// the second line up in this example:
200	//
201	// // line 1
202	// // line 2
203	//
204	// That amounts to 2 changes by BreakableLineCommentSection:
205	// - the first, delimited by (), for the whitespace between the tokens,
206	// - and second, delimited by [], for the whitespace at the beginning
207	// of the second token:
208	//
209	// // line 1(
210	// )[// ]line 2
211	//
212	// So in the end we have two changes like this:
213	//
214	// // line1()[ ]line 2
215	//
216	// Note that the OriginalWhitespaceStart of the second change is the
217	// same as the PreviousOriginalWhitespaceEnd of the first change.
218	// In this case, the below check ensures that the second change doesn't
219	// get treated as a trailing comment change here, since this might
220	// trigger additional whitespace to be wrongly inserted before "line 2"
221	// by the comment aligner here.
222	//
223	// For a proper solution we need a mechanism to say to WhitespaceManager
224	// that a particular change breaks the current sequence of trailing
225	// comments.
226	OriginalWhitespaceStart != PreviousOriginalWhitespaceEnd;
227	}
228	// FIXME: The last token is currently not always an eof token; in those
229	// cases, setting TokenLength of the last token to 0 is wrong.
230	Changes.back().TokenLength = `0`;
231	Changes.back().IsTrailingComment = Changes.back().Tok->is(Kind: tok::comment);
232
233	const WhitespaceManager::Change LastBlockComment = nullptr*;
234	for (auto &Change : Changes) {
235	// Reset the IsTrailingComment flag for changes inside of trailing comments
236	// so they don't get realigned later. Comment line breaks however still need
237	// to be aligned.
238	if (Change.IsInsideToken && Change.NewlinesBefore == `0`)
239	Change.IsTrailingComment = false;
240	Change.StartOfBlockComment = nullptr;
241	Change.IndentationOffset = `0`;
242	if (Change.Tok->is(Kind: tok::comment)) {
243	if (Change.Tok->is(TT: TT_LineComment) \|\| !Change.IsInsideToken) {
244	LastBlockComment = &Change;
245	} else if ((Change.StartOfBlockComment = LastBlockComment)) {
246	Change.IndentationOffset =
247	Change.StartOfTokenColumn -
248	Change.StartOfBlockComment->StartOfTokenColumn;
249	}
250	} else {
251	LastBlockComment = nullptr;
252	}
253	}
254
255	// Compute conditional nesting level
256	// Level is increased for each conditional, unless this conditional continues
257	// a chain of conditional, i.e. starts immediately after the colon of another
258	// conditional.
259	SmallVector<bool, `16`> ScopeStack;
260	int ConditionalsLevel = `0`;
261	for (auto &Change : Changes) {
262	for (unsigned i = `0`, e = Change.Tok->FakeLParens.size(); i != e; ++i) {
263	bool isNestedConditional =
264	Change.Tok->FakeLParens [e - `1` - i] == prec::Conditional &&
265	!(i == `0` && Change.Tok->Previous &&
266	Change.Tok->Previous->is(TT: TT_ConditionalExpr) &&
267	Change.Tok->Previous->is(Kind: tok::colon));
268	if (isNestedConditional)
269	++ConditionalsLevel;
270	ScopeStack.push_back(Elt: isNestedConditional);
271	}
272
273	Change.ConditionalsLevel = ConditionalsLevel;
274
275	for (unsigned i = Change.Tok->FakeRParens; i > `0` && ScopeStack.size(); --i)
276	if (ScopeStack.pop_back_val())
277	--ConditionalsLevel;
278	}
279	}
280
281	// Align a single sequence of tokens, see AlignTokens below.
282	// Column - The token for which Matches returns true is moved to this column.
283	// RightJustify - Whether it is the token's right end or left end that gets
284	// moved to that column.
285	template <typename F>
286	static void
287	AlignTokenSequence(const FormatStyle &Style, unsigned Start, unsigned End,
288	unsigned Column, bool RightJustify, F &&Matches,
289	SmallVector<WhitespaceManager::Change, `16`> &Changes) {
290	bool FoundMatchOnLine = false;
291	int Shift = `0`;
292
293	// ScopeStack keeps track of the current scope depth. It contains indices of
294	// the first token on each scope.
295	// We only run the "Matches" function on tokens from the outer-most scope.
296	// However, we do need to pay special attention to one class of tokens
297	// that are not in the outer-most scope, and that is function parameters
298	// which are split across multiple lines, as illustrated by this example:
299	// double a(int x);
300	// int b(int y,
301	// double z);
302	// In the above example, we need to take special care to ensure that
303	// 'double z' is indented along with it's owning function 'b'.
304	// The same holds for calling a function:
305	// double a = foo(x);
306	// int b = bar(foo(y),
307	// foor(z));
308	// Similar for broken string literals:
309	// double x = 3.14;
310	// auto s = "Hello"
311	// "World";
312	// Special handling is required for 'nested' ternary operators.
313	SmallVector<unsigned, `16`> ScopeStack;
314
315	for (unsigned i = Start; i != End; ++i) {
316	auto &CurrentChange = Changes [i];
317	if (ScopeStack.size() != `0` &&
318	CurrentChange.indentAndNestingLevel() <
319	Changes [ScopeStack.back()].indentAndNestingLevel()) {
320	ScopeStack.pop_back();
321	}
322
323	// Compare current token to previous non-comment token to ensure whether
324	// it is in a deeper scope or not.
325	unsigned PreviousNonComment = i - `1`;
326	while (PreviousNonComment > Start &&
327	Changes [PreviousNonComment].Tok->is(Kind: tok::comment)) {
328	--PreviousNonComment;
329	}
330	if (i != Start && CurrentChange.indentAndNestingLevel() >
331	Changes [PreviousNonComment].indentAndNestingLevel()) {
332	ScopeStack.push_back(Elt: i);
333	}
334
335	bool InsideNestedScope = ScopeStack.size() != `0`;
336	bool ContinuedStringLiteral = i > Start &&
337	CurrentChange.Tok->is(Kind: tok::string_literal) &&
338	Changes [i - `1`].Tok->is(Kind: tok::string_literal);
339	bool SkipMatchCheck = InsideNestedScope \|\| ContinuedStringLiteral;
340
341	if (CurrentChange.NewlinesBefore > `0` && !SkipMatchCheck) {
342	Shift = `0`;
343	FoundMatchOnLine = false;
344	}
345
346	// If this is the first matching token to be aligned, remember by how many
347	// spaces it has to be shifted, so the rest of the changes on the line are
348	// shifted by the same amount
349	if (!FoundMatchOnLine && !SkipMatchCheck && Matches(CurrentChange)) {
350	FoundMatchOnLine = true;
351	Shift = Column - (RightJustify ? CurrentChange.TokenLength : `0`) -
352	CurrentChange.StartOfTokenColumn;
353	CurrentChange.Spaces += Shift;
354	// FIXME: This is a workaround that should be removed when we fix
355	// http://llvm.org/PR53699. An assertion later below verifies this.
356	if (CurrentChange.NewlinesBefore == `0`) {
357	CurrentChange.Spaces =
358	std::max(a: CurrentChange.Spaces,
359	b: static_cast<int>(CurrentChange.Tok->SpacesRequiredBefore));
360	}
361	}
362
363	if (Shift == `0`)
364	continue;
365
366	// This is for function parameters that are split across multiple lines,
367	// as mentioned in the ScopeStack comment.
368	if (InsideNestedScope && CurrentChange.NewlinesBefore > `0`) {
369	unsigned ScopeStart = ScopeStack.back();
370	auto ShouldShiftBeAdded = [&] {
371	// Function declaration
372	if (Changes [ScopeStart - `1`].Tok->is(TT: TT_FunctionDeclarationName))
373	return true;
374
375	// Lambda.
376	if (Changes [ScopeStart - `1`].Tok->is(TT: TT_LambdaLBrace))
377	return false;
378
379	// Continued function declaration
380	if (ScopeStart > Start + `1` &&
381	Changes [ScopeStart - `2`].Tok->is(TT: TT_FunctionDeclarationName)) {
382	return true;
383	}
384
385	// Continued (template) function call.
386	if (ScopeStart > Start + `1` &&
387	Changes [ScopeStart - `2`].Tok->isOneOf(K1: tok::identifier,
388	K2: TT_TemplateCloser) &&
389	Changes [ScopeStart - `1`].Tok->is(Kind: tok::l_paren) &&
390	Changes [ScopeStart].Tok->isNot(Kind: TT_LambdaLSquare)) {
391	if (CurrentChange.Tok->MatchingParen &&
392	CurrentChange.Tok->MatchingParen->is(TT: TT_LambdaLBrace)) {
393	return false;
394	}
395	if (Changes [ScopeStart].NewlinesBefore > `0`)
396	return false;
397	if (CurrentChange.Tok->is(Kind: tok::l_brace) &&
398	CurrentChange.Tok->is(BBK: BK_BracedInit)) {
399	return true;
400	}
401	return Style.BinPackArguments;
402	}
403
404	// Ternary operator
405	if (CurrentChange.Tok->is(TT: TT_ConditionalExpr))
406	return true;
407
408	// Period Initializer .XXX = 1.
409	if (CurrentChange.Tok->is(TT: TT_DesignatedInitializerPeriod))
410	return true;
411
412	// Continued ternary operator
413	if (CurrentChange.Tok->Previous &&
414	CurrentChange.Tok->Previous->is(TT: TT_ConditionalExpr)) {
415	return true;
416	}
417
418	// Continued direct-list-initialization using braced list.
419	if (ScopeStart > Start + `1` &&
420	Changes [ScopeStart - `2`].Tok->is(Kind: tok::identifier) &&
421	Changes [ScopeStart - `1`].Tok->is(Kind: tok::l_brace) &&
422	CurrentChange.Tok->is(Kind: tok::l_brace) &&
423	CurrentChange.Tok->is(BBK: BK_BracedInit)) {
424	return true;
425	}
426
427	// Continued braced list.
428	if (ScopeStart > Start + `1` &&
429	Changes [ScopeStart - `2`].Tok->isNot(Kind: tok::identifier) &&
430	Changes [ScopeStart - `1`].Tok->is(Kind: tok::l_brace) &&
431	CurrentChange.Tok->isNot(Kind: tok::r_brace)) {
432	for (unsigned OuterScopeStart : llvm::reverse(C&: ScopeStack)) {
433	// Lambda.
434	if (OuterScopeStart > Start &&
435	Changes [OuterScopeStart - `1`].Tok->is(TT: TT_LambdaLBrace)) {
436	return false;
437	}
438	}
439	if (Changes [ScopeStart].NewlinesBefore > `0`)
440	return false;
441	return true;
442	}
443
444	// Continued template parameter.
445	if (Changes [ScopeStart - `1`].Tok->is(TT: TT_TemplateOpener))
446	return true;
447
448	return false;
449	};
450
451	if (ShouldShiftBeAdded())
452	CurrentChange.Spaces += Shift;
453	}
454
455	if (ContinuedStringLiteral)
456	CurrentChange.Spaces += Shift;
457
458	// We should not remove required spaces unless we break the line before.
459	assert(Shift > `0` \|\| Changes[i].NewlinesBefore > `0` \|\|
460	CurrentChange.Spaces >=
461	static_cast<int>(Changes[i].Tok->SpacesRequiredBefore) \|\|
462	CurrentChange.Tok->is(tok::eof));
463
464	CurrentChange.StartOfTokenColumn += Shift;
465	if (i + `1` != Changes.size())
466	Changes [i + `1`].PreviousEndOfTokenColumn += Shift;
467
468	// If PointerAlignment is PAS_Right, keep s or &s next to the token,*
469	// except if the token is equal, then a space is needed.
470	if ((Style.PointerAlignment == FormatStyle::PAS_Right \|\|
471	Style.ReferenceAlignment == FormatStyle::RAS_Right) &&
472	CurrentChange.Spaces != `0` &&
473	!CurrentChange.Tok->isOneOf(K1: tok::equal, K2: tok::r_paren,
474	Ks: TT_TemplateCloser)) {
475	const bool ReferenceNotRightAligned =
476	Style.ReferenceAlignment != FormatStyle::RAS_Right &&
477	Style.ReferenceAlignment != FormatStyle::RAS_Pointer;
478	for (int Previous = i - `1`;
479	Previous >= `0` && Changes [Previous].Tok->is(TT: TT_PointerOrReference);
480	--Previous) {
481	assert(Changes[Previous].Tok->isPointerOrReference());
482	if (Changes [Previous].Tok->isNot(Kind: tok::star)) {
483	if (ReferenceNotRightAligned)
484	continue;
485	} else if (Style.PointerAlignment != FormatStyle::PAS_Right) {
486	continue;
487	}
488	Changes [Previous + `1`].Spaces -= Shift;
489	Changes [Previous].Spaces += Shift;
490	Changes [Previous].StartOfTokenColumn += Shift;
491	}
492	}
493	}
494	}
495
496	// Walk through a subset of the changes, starting at StartAt, and find
497	// sequences of matching tokens to align. To do so, keep track of the lines and
498	// whether or not a matching token was found on a line. If a matching token is
499	// found, extend the current sequence. If the current line cannot be part of a
500	// sequence, e.g. because there is an empty line before it or it contains only
501	// non-matching tokens, finalize the previous sequence.
502	// The value returned is the token on which we stopped, either because we
503	// exhausted all items inside Changes, or because we hit a scope level higher
504	// than our initial scope.
505	// This function is recursive. Each invocation processes only the scope level
506	// equal to the initial level, which is the level of Changes[StartAt].
507	// If we encounter a scope level greater than the initial level, then we call
508	// ourselves recursively, thereby avoiding the pollution of the current state
509	// with the alignment requirements of the nested sub-level. This recursive
510	// behavior is necessary for aligning function prototypes that have one or more
511	// arguments.
512	// If this function encounters a scope level less than the initial level,
513	// it returns the current position.
514	// There is a non-obvious subtlety in the recursive behavior: Even though we
515	// defer processing of nested levels to recursive invocations of this
516	// function, when it comes time to align a sequence of tokens, we run the
517	// alignment on the entire sequence, including the nested levels.
518	// When doing so, most of the nested tokens are skipped, because their
519	// alignment was already handled by the recursive invocations of this function.
520	// However, the special exception is that we do NOT skip function parameters
521	// that are split across multiple lines. See the test case in FormatTest.cpp
522	// that mentions "split function parameter alignment" for an example of this.
523	// When the parameter RightJustify is true, the operator will be
524	// right-justified. It is used to align compound assignments like `+=` and `=`.
525	// When RightJustify and ACS.PadOperators are true, operators in each block to
526	// be aligned will be padded on the left to the same length before aligning.
527	template <typename F>
528	static unsigned AlignTokens(const FormatStyle &Style, F &&Matches,
529	SmallVector<WhitespaceManager::Change, `16`> &Changes,
530	unsigned StartAt,
531	const FormatStyle::AlignConsecutiveStyle &ACS = {},
532	bool RightJustify = false) {
533	// We arrange each line in 3 parts. The operator to be aligned (the anchor),
534	// and text to its left and right. In the aligned text the width of each part
535	// will be the maximum of that over the block that has been aligned. Maximum
536	// widths of each part so far. When RightJustify is true and ACS.PadOperators
537	// is false, the part from start of line to the right end of the anchor.
538	// Otherwise, only the part to the left of the anchor. Including the space
539	// that exists on its left from the start. Not including the padding added on
540	// the left to right-justify the anchor.
541	unsigned WidthLeft = `0`;
542	// The operator to be aligned when RightJustify is true and ACS.PadOperators
543	// is false. 0 otherwise.
544	unsigned WidthAnchor = `0`;
545	// Width to the right of the anchor. Plus width of the anchor when
546	// RightJustify is false.
547	unsigned WidthRight = `0`;
548
549	// Line number of the start and the end of the current token sequence.
550	unsigned StartOfSequence = `0`;
551	unsigned EndOfSequence = `0`;
552
553	// Measure the scope level (i.e. depth of (), [], {}) of the first token, and
554	// abort when we hit any token in a higher scope than the starting one.
555	auto IndentAndNestingLevel = StartAt < Changes.size()
556	? Changes [StartAt].indentAndNestingLevel()
557	: std::tuple<unsigned, unsigned, unsigned>();
558
559	// Keep track of the number of commas before the matching tokens, we will only
560	// align a sequence of matching tokens if they are preceded by the same number
561	// of commas.
562	unsigned CommasBeforeLastMatch = `0`;
563	unsigned CommasBeforeMatch = `0`;
564
565	// Whether a matching token has been found on the current line.
566	bool FoundMatchOnLine = false;
567
568	// Whether the current line consists purely of comments.
569	bool LineIsComment = true;
570
571	// Aligns a sequence of matching tokens, on the MinColumn column.
572	//
573	// Sequences start from the first matching token to align, and end at the
574	// first token of the first line that doesn't need to be aligned.
575	//
576	// We need to adjust the StartOfTokenColumn of each Change that is on a line
577	// containing any matching token to be aligned and located after such token.
578	auto AlignCurrentSequence = [&] {
579	if (StartOfSequence > `0` && StartOfSequence < EndOfSequence) {
580	AlignTokenSequence(Style, StartOfSequence, EndOfSequence,
581	WidthLeft + WidthAnchor, RightJustify, Matches,
582	Changes);
583	}
584	WidthLeft = `0`;
585	WidthAnchor = `0`;
586	WidthRight = `0`;
587	StartOfSequence = `0`;
588	EndOfSequence = `0`;
589	};
590
591	unsigned i = StartAt;
592	for (unsigned e = Changes.size(); i != e; ++i) {
593	auto &CurrentChange = Changes [i];
594	if (CurrentChange.indentAndNestingLevel() < IndentAndNestingLevel)
595	break;
596
597	if (CurrentChange.NewlinesBefore != `0`) {
598	CommasBeforeMatch = `0`;
599	EndOfSequence = i;
600
601	// Whether to break the alignment sequence because of an empty line.
602	bool EmptyLineBreak =
603	(CurrentChange.NewlinesBefore > `1`) && !ACS.AcrossEmptyLines;
604
605	// Whether to break the alignment sequence because of a line without a
606	// match.
607	bool NoMatchBreak =
608	!FoundMatchOnLine && !(LineIsComment && ACS.AcrossComments);
609
610	if (EmptyLineBreak \|\| NoMatchBreak)
611	AlignCurrentSequence();
612
613	// A new line starts, re-initialize line status tracking bools.
614	// Keep the match state if a string literal is continued on this line.
615	if (i == `0` \|\| CurrentChange.Tok->isNot(Kind: tok::string_literal) \|\|
616	Changes [i - `1`].Tok->isNot(Kind: tok::string_literal)) {
617	FoundMatchOnLine = false;
618	}
619	LineIsComment = true;
620	}
621
622	if (CurrentChange.Tok->isNot(Kind: tok::comment))
623	LineIsComment = false;
624
625	if (CurrentChange.Tok->is(Kind: tok::comma)) {
626	++CommasBeforeMatch;
627	} else if (CurrentChange.indentAndNestingLevel() > IndentAndNestingLevel) {
628	// Call AlignTokens recursively, skipping over this scope block.
629	unsigned StoppedAt =
630	AlignTokens(Style, Matches, Changes, i, ACS, RightJustify);
631	i = StoppedAt - `1`;
632	continue;
633	}
634
635	if (!Matches(CurrentChange))
636	continue;
637
638	// If there is more than one matching token per line, or if the number of
639	// preceding commas, do not match anymore, end the sequence.
640	if (FoundMatchOnLine \|\| CommasBeforeMatch != CommasBeforeLastMatch)
641	AlignCurrentSequence();
642
643	CommasBeforeLastMatch = CommasBeforeMatch;
644	FoundMatchOnLine = true;
645
646	if (StartOfSequence == `0`)
647	StartOfSequence = i;
648
649	unsigned ChangeWidthLeft = CurrentChange.StartOfTokenColumn;
650	unsigned ChangeWidthAnchor = `0`;
651	unsigned ChangeWidthRight = `0`;
652	if (RightJustify)
653	if (ACS.PadOperators)
654	ChangeWidthAnchor = CurrentChange.TokenLength;
655	else
656	ChangeWidthLeft += CurrentChange.TokenLength;
657	else
658	ChangeWidthRight = CurrentChange.TokenLength;
659	for (unsigned j = i + `1`; j != e && Changes [j].NewlinesBefore == `0`; ++j) {
660	ChangeWidthRight += Changes [j].Spaces;
661	// Changes are generally 1:1 with the tokens, but a change could also be
662	// inside of a token, in which case it's counted more than once: once for
663	// the whitespace surrounding the token (!IsInsideToken) and once for
664	// each whitespace change within it (IsInsideToken).
665	// Therefore, changes inside of a token should only count the space.
666	if (!Changes [j].IsInsideToken)
667	ChangeWidthRight += Changes [j].TokenLength;
668	}
669
670	// If we are restricted by the maximum column width, end the sequence.
671	unsigned NewLeft = std::max(a: ChangeWidthLeft, b: WidthLeft);
672	unsigned NewAnchor = std::max(a: ChangeWidthAnchor, b: WidthAnchor);
673	unsigned NewRight = std::max(a: ChangeWidthRight, b: WidthRight);
674	// `ColumnLimit == 0` means there is no column limit.
675	if (Style.ColumnLimit != `0` &&
676	Style.ColumnLimit < NewLeft + NewAnchor + NewRight) {
677	AlignCurrentSequence();
678	StartOfSequence = i;
679	WidthLeft = ChangeWidthLeft;
680	WidthAnchor = ChangeWidthAnchor;
681	WidthRight = ChangeWidthRight;
682	} else {
683	WidthLeft = NewLeft;
684	WidthAnchor = NewAnchor;
685	WidthRight = NewRight;
686	}
687	}
688
689	EndOfSequence = i;
690	AlignCurrentSequence();
691	return i;
692	}
693
694	// Aligns a sequence of matching tokens, on the MinColumn column.
695	//
696	// Sequences start from the first matching token to align, and end at the
697	// first token of the first line that doesn't need to be aligned.
698	//
699	// We need to adjust the StartOfTokenColumn of each Change that is on a line
700	// containing any matching token to be aligned and located after such token.
701	static void AlignMatchingTokenSequence(
702	unsigned &StartOfSequence, unsigned &EndOfSequence, unsigned &MinColumn,
703	std::function<bool(const WhitespaceManager::Change &C)> Matches,
704	SmallVector<WhitespaceManager::Change, `16`> &Changes) {
705	if (StartOfSequence > `0` && StartOfSequence < EndOfSequence) {
706	bool FoundMatchOnLine = false;
707	int Shift = `0`;
708
709	for (unsigned I = StartOfSequence; I != EndOfSequence; ++I) {
710	if (Changes [I].NewlinesBefore > `0`) {
711	Shift = `0`;
712	FoundMatchOnLine = false;
713	}
714
715	// If this is the first matching token to be aligned, remember by how many
716	// spaces it has to be shifted, so the rest of the changes on the line are
717	// shifted by the same amount.
718	if (!FoundMatchOnLine && Matches (Changes [I])) {
719	FoundMatchOnLine = true;
720	Shift = MinColumn - Changes [I].StartOfTokenColumn;
721	Changes [I].Spaces += Shift;
722	}
723
724	assert(Shift >= `0`);
725	Changes [I].StartOfTokenColumn += Shift;
726	if (I + `1` != Changes.size())
727	Changes [I + `1`].PreviousEndOfTokenColumn += Shift;
728	}
729	}
730
731	MinColumn = `0`;
732	StartOfSequence = `0`;
733	EndOfSequence = `0`;
734	}
735
736	void WhitespaceManager::alignConsecutiveMacros() {
737	if (!Style.AlignConsecutiveMacros.Enabled)
738	return;
739
740	auto AlignMacrosMatches = [](const Change &C) {
741	const FormatToken *Current = C.Tok;
742	unsigned SpacesRequiredBefore = `1`;
743
744	if (Current->SpacesRequiredBefore == `0` \|\| !Current->Previous)
745	return false;
746
747	Current = Current->Previous;
748
749	// If token is a ")", skip over the parameter list, to the
750	// token that precedes the "("
751	if (Current->is(Kind: tok::r_paren) && Current->MatchingParen) {
752	Current = Current->MatchingParen->Previous;
753	SpacesRequiredBefore = `0`;
754	}
755
756	if (!Current \|\| Current->isNot(Kind: tok::identifier))
757	return false;
758
759	if (!Current->Previous \|\| Current->Previous->isNot(Kind: tok::pp_define))
760	return false;
761
762	// For a macro function, 0 spaces are required between the
763	// identifier and the lparen that opens the parameter list.
764	// For a simple macro, 1 space is required between the
765	// identifier and the first token of the defined value.
766	return Current->Next->SpacesRequiredBefore == SpacesRequiredBefore;
767	};
768
769	unsigned MinColumn = `0`;
770
771	// Start and end of the token sequence we're processing.
772	unsigned StartOfSequence = `0`;
773	unsigned EndOfSequence = `0`;
774
775	// Whether a matching token has been found on the current line.
776	bool FoundMatchOnLine = false;
777
778	// Whether the current line consists only of comments
779	bool LineIsComment = true;
780
781	unsigned I = `0`;
782	for (unsigned E = Changes.size(); I != E; ++I) {
783	if (Changes [I].NewlinesBefore != `0`) {
784	EndOfSequence = I;
785
786	// Whether to break the alignment sequence because of an empty line.
787	bool EmptyLineBreak = (Changes [I].NewlinesBefore > `1`) &&
788	!Style.AlignConsecutiveMacros.AcrossEmptyLines;
789
790	// Whether to break the alignment sequence because of a line without a
791	// match.
792	bool NoMatchBreak =
793	!FoundMatchOnLine &&
794	!(LineIsComment && Style.AlignConsecutiveMacros.AcrossComments);
795
796	if (EmptyLineBreak \|\| NoMatchBreak) {
797	AlignMatchingTokenSequence(StartOfSequence, EndOfSequence, MinColumn,
798	Matches: AlignMacrosMatches, Changes);
799	}
800
801	// A new line starts, re-initialize line status tracking bools.
802	FoundMatchOnLine = false;
803	LineIsComment = true;
804	}
805
806	if (Changes [I].Tok->isNot(Kind: tok::comment))
807	LineIsComment = false;
808
809	if (!AlignMacrosMatches (Changes [I]))
810	continue;
811
812	FoundMatchOnLine = true;
813
814	if (StartOfSequence == `0`)
815	StartOfSequence = I;
816
817	unsigned ChangeMinColumn = Changes [I].StartOfTokenColumn;
818	MinColumn = std::max(a: MinColumn, b: ChangeMinColumn);
819	}
820
821	EndOfSequence = I;
822	AlignMatchingTokenSequence(StartOfSequence, EndOfSequence, MinColumn,
823	Matches: AlignMacrosMatches, Changes);
824	}
825
826	void WhitespaceManager::alignConsecutiveAssignments() {
827	if (!Style.AlignConsecutiveAssignments.Enabled)
828	return;
829
830	AlignTokens(
831	Style,
832	Matches: [&](const Change &C) {
833	// Do not align on equal signs that are first on a line.
834	if (C.NewlinesBefore > `0`)
835	return false;
836
837	// Do not align on equal signs that are last on a line.
838	if (&C != &Changes.back() && (&C + `1`)->NewlinesBefore > `0`)
839	return false;
840
841	// Do not align operator= overloads.
842	FormatToken *Previous = C.Tok->getPreviousNonComment();
843	if (Previous && Previous->is(Kind: tok::kw_operator))
844	return false;
845
846	return Style.AlignConsecutiveAssignments.AlignCompound
847	? C.Tok->getPrecedence() == prec::Assignment
848	: (C.Tok->is(Kind: tok::equal) \|\|
849	// In Verilog the '<=' is not a compound assignment, thus
850	// it is aligned even when the AlignCompound option is not
851	// set.
852	(Style.isVerilog() && C.Tok->is(Kind: tok::lessequal) &&
853	C.Tok->getPrecedence() == prec::Assignment));
854	},
855	Changes, /StartAt=/`0`, ACS: Style.AlignConsecutiveAssignments,
856	/RightJustify=/true);
857	}
858
859	void WhitespaceManager::alignConsecutiveBitFields() {
860	alignConsecutiveColons(AlignStyle: Style.AlignConsecutiveBitFields, Type: TT_BitFieldColon);
861	}
862
863	void WhitespaceManager::alignConsecutiveColons(
864	const FormatStyle::AlignConsecutiveStyle &AlignStyle, TokenType Type) {
865	if (!AlignStyle.Enabled)
866	return;
867
868	AlignTokens(
869	Style,
870	Matches: [&](Change const &C) {
871	// Do not align on ':' that is first on a line.
872	if (C.NewlinesBefore > `0`)
873	return false;
874
875	// Do not align on ':' that is last on a line.
876	if (&C != &Changes.back() && (&C + `1`)->NewlinesBefore > `0`)
877	return false;
878
879	return C.Tok->is(TT: Type);
880	},
881	Changes, /StartAt=/`0`, ACS: AlignStyle);
882	}
883
884	void WhitespaceManager::alignConsecutiveShortCaseStatements(bool IsExpr) {
885	if (!Style.AlignConsecutiveShortCaseStatements.Enabled \|\|
886	!(IsExpr ? Style.AllowShortCaseExpressionOnASingleLine
887	: Style.AllowShortCaseLabelsOnASingleLine)) {
888	return;
889	}
890
891	const auto Type = IsExpr ? TT_CaseLabelArrow : TT_CaseLabelColon;
892	const auto &Option = Style.AlignConsecutiveShortCaseStatements;
893	const bool AlignArrowOrColon =
894	IsExpr ? Option.AlignCaseArrows : Option.AlignCaseColons;
895
896	auto Matches = [&](const Change &C) {
897	if (AlignArrowOrColon)
898	return C.Tok->is(TT: Type);
899
900	// Ignore 'IsInsideToken' to allow matching trailing comments which
901	// need to be reflowed as that causes the token to appear in two
902	// different changes, which will cause incorrect alignment as we'll
903	// reflow early due to detecting multiple aligning tokens per line.
904	return !C.IsInsideToken && C.Tok->Previous && C.Tok->Previous->is(TT: Type);
905	};
906
907	unsigned MinColumn = `0`;
908
909	// Empty case statements don't break the alignment, but don't necessarily
910	// match our predicate, so we need to track their column so they can push out
911	// our alignment.
912	unsigned MinEmptyCaseColumn = `0`;
913
914	// Start and end of the token sequence we're processing.
915	unsigned StartOfSequence = `0`;
916	unsigned EndOfSequence = `0`;
917
918	// Whether a matching token has been found on the current line.
919	bool FoundMatchOnLine = false;
920
921	bool LineIsComment = true;
922	bool LineIsEmptyCase = false;
923
924	unsigned I = `0`;
925	for (unsigned E = Changes.size(); I != E; ++I) {
926	if (Changes [I].NewlinesBefore != `0`) {
927	// Whether to break the alignment sequence because of an empty line.
928	bool EmptyLineBreak =
929	(Changes [I].NewlinesBefore > `1`) &&
930	!Style.AlignConsecutiveShortCaseStatements.AcrossEmptyLines;
931
932	// Whether to break the alignment sequence because of a line without a
933	// match.
934	bool NoMatchBreak =
935	!FoundMatchOnLine &&
936	!(LineIsComment &&
937	Style.AlignConsecutiveShortCaseStatements.AcrossComments) &&
938	!LineIsEmptyCase;
939
940	if (EmptyLineBreak \|\| NoMatchBreak) {
941	AlignMatchingTokenSequence(StartOfSequence, EndOfSequence, MinColumn,
942	Matches, Changes);
943	MinEmptyCaseColumn = `0`;
944	}
945
946	// A new line starts, re-initialize line status tracking bools.
947	FoundMatchOnLine = false;
948	LineIsComment = true;
949	LineIsEmptyCase = false;
950	}
951
952	if (Changes [I].Tok->isNot(Kind: tok::comment))
953	LineIsComment = false;
954
955	if (Changes [I].Tok->is(TT: Type)) {
956	LineIsEmptyCase =
957	!Changes [I].Tok->Next \|\| Changes [I].Tok->Next->isTrailingComment();
958
959	if (LineIsEmptyCase) {
960	if (Style.AlignConsecutiveShortCaseStatements.AlignCaseColons) {
961	MinEmptyCaseColumn =
962	std::max(a: MinEmptyCaseColumn, b: Changes [I].StartOfTokenColumn);
963	} else {
964	MinEmptyCaseColumn =
965	std::max(a: MinEmptyCaseColumn, b: Changes [I].StartOfTokenColumn + `2`);
966	}
967	}
968	}
969
970	if (!Matches (Changes [I]))
971	continue;
972
973	if (LineIsEmptyCase)
974	continue;
975
976	FoundMatchOnLine = true;
977
978	if (StartOfSequence == `0`)
979	StartOfSequence = I;
980
981	EndOfSequence = I + `1`;
982
983	MinColumn = std::max(a: MinColumn, b: Changes [I].StartOfTokenColumn);
984
985	// Allow empty case statements to push out our alignment.
986	MinColumn = std::max(a: MinColumn, b: MinEmptyCaseColumn);
987	}
988
989	AlignMatchingTokenSequence(StartOfSequence, EndOfSequence, MinColumn, Matches,
990	Changes);
991	}
992
993	void WhitespaceManager::alignConsecutiveTableGenBreakingDAGArgColons() {
994	alignConsecutiveColons(AlignStyle: Style.AlignConsecutiveTableGenBreakingDAGArgColons,
995	Type: TT_TableGenDAGArgListColonToAlign);
996	}
997
998	void WhitespaceManager::alignConsecutiveTableGenCondOperatorColons() {
999	alignConsecutiveColons(AlignStyle: Style.AlignConsecutiveTableGenCondOperatorColons,
1000	Type: TT_TableGenCondOperatorColon);
1001	}
1002
1003	void WhitespaceManager::alignConsecutiveTableGenDefinitions() {
1004	alignConsecutiveColons(AlignStyle: Style.AlignConsecutiveTableGenDefinitionColons,
1005	Type: TT_InheritanceColon);
1006	}
1007
1008	void WhitespaceManager::alignConsecutiveDeclarations() {
1009	if (!Style.AlignConsecutiveDeclarations.Enabled)
1010	return;
1011
1012	AlignTokens(
1013	Style,
1014	Matches: [&](Change const &C) {
1015	if (Style.AlignConsecutiveDeclarations.AlignFunctionPointers) {
1016	for (const auto *Prev = C.Tok->Previous; Prev; Prev = Prev->Previous)
1017	if (Prev->is(Kind: tok::equal))
1018	return false;
1019	if (C.Tok->is(TT: TT_FunctionTypeLParen))
1020	return true;
1021	}
1022	if (C.Tok->is(TT: TT_FunctionDeclarationName))
1023	return true;
1024	if (C.Tok->isNot(Kind: TT_StartOfName))
1025	return false;
1026	if (C.Tok->Previous &&
1027	C.Tok->Previous->is(TT: TT_StatementAttributeLikeMacro))
1028	return false;
1029	// Check if there is a subsequent name that starts the same declaration.
1030	for (FormatToken *Next = C.Tok->Next; Next; Next = Next->Next) {
1031	if (Next->is(Kind: tok::comment))
1032	continue;
1033	if (Next->is(TT: TT_PointerOrReference))
1034	return false;
1035	if (!Next->Tok.getIdentifierInfo())
1036	break;
1037	if (Next->isOneOf(K1: TT_StartOfName, K2: TT_FunctionDeclarationName,
1038	Ks: tok::kw_operator)) {
1039	return false;
1040	}
1041	}
1042	return true;
1043	},
1044	Changes, /StartAt=/`0`, ACS: Style.AlignConsecutiveDeclarations);
1045	}
1046
1047	void WhitespaceManager::alignChainedConditionals() {
1048	if (Style.BreakBeforeTernaryOperators) {
1049	AlignTokens(
1050	Style,
1051	Matches: [](Change const &C) {
1052	// Align question operators and last colon
1053	return C.Tok->is(TT: TT_ConditionalExpr) &&
1054	((C.Tok->is(Kind: tok::question) && !C.NewlinesBefore) \|\|
1055	(C.Tok->is(Kind: tok::colon) && C.Tok->Next &&
1056	(C.Tok->Next->FakeLParens.size() == `0` \|\|
1057	C.Tok->Next->FakeLParens.back() != prec::Conditional)));
1058	},
1059	Changes, /StartAt=/`0`);
1060	} else {
1061	static auto AlignWrappedOperand = [](Change const &C) {
1062	FormatToken *Previous = C.Tok->getPreviousNonComment();
1063	return C.NewlinesBefore && Previous && Previous->is(TT: TT_ConditionalExpr) &&
1064	(Previous->is(Kind: tok::colon) &&
1065	(C.Tok->FakeLParens.size() == `0` \|\|
1066	C.Tok->FakeLParens.back() != prec::Conditional));
1067	};
1068	// Ensure we keep alignment of wrapped operands with non-wrapped operands
1069	// Since we actually align the operators, the wrapped operands need the
1070	// extra offset to be properly aligned.
1071	for (Change &C : Changes)
1072	if (AlignWrappedOperand (C))
1073	C.StartOfTokenColumn -= `2`;
1074	AlignTokens(
1075	Style,
1076	Matches: [this](Change const &C) {
1077	// Align question operators if next operand is not wrapped, as
1078	// well as wrapped operands after question operator or last
1079	// colon in conditional sequence
1080	return (C.Tok->is(TT: TT_ConditionalExpr) && C.Tok->is(Kind: tok::question) &&
1081	&C != &Changes.back() && (&C + `1`)->NewlinesBefore == `0` &&
1082	!(&C + `1`)->IsTrailingComment) \|\|
1083	AlignWrappedOperand (C);
1084	},
1085	Changes, /StartAt=/`0`);
1086	}
1087	}
1088
1089	void WhitespaceManager::alignTrailingComments() {
1090	if (Style.AlignTrailingComments.Kind == FormatStyle::TCAS_Never)
1091	return;
1092
1093	const int Size = Changes.size();
1094	int MinColumn = `0`;
1095	int StartOfSequence = `0`;
1096	bool BreakBeforeNext = false;
1097	int NewLineThreshold = `1`;
1098	if (Style.AlignTrailingComments.Kind == FormatStyle::TCAS_Always)
1099	NewLineThreshold = Style.AlignTrailingComments.OverEmptyLines + `1`;
1100
1101	for (int I = `0`, MaxColumn = INT_MAX, Newlines = `0`; I < Size; ++I) {
1102	auto &C = Changes [I];
1103	if (C.StartOfBlockComment)
1104	continue;
1105	Newlines += C.NewlinesBefore;
1106	if (!C.IsTrailingComment)
1107	continue;
1108
1109	if (Style.AlignTrailingComments.Kind == FormatStyle::TCAS_Leave) {
1110	const int OriginalSpaces =
1111	C.OriginalWhitespaceRange.getEnd().getRawEncoding() -
1112	C.OriginalWhitespaceRange.getBegin().getRawEncoding() -
1113	C.Tok->LastNewlineOffset;
1114	assert(OriginalSpaces >= `0`);
1115	const auto RestoredLineLength =
1116	C.StartOfTokenColumn + C.TokenLength + OriginalSpaces;
1117	// If leaving comments makes the line exceed the column limit, give up to
1118	// leave the comments.
1119	if (RestoredLineLength >= Style.ColumnLimit && Style.ColumnLimit > `0`)
1120	break;
1121	C.Spaces = C.NewlinesBefore > `0` ? C.Tok->OriginalColumn : OriginalSpaces;
1122	continue;
1123	}
1124
1125	const int ChangeMinColumn = C.StartOfTokenColumn;
1126	int ChangeMaxColumn;
1127
1128	// If we don't create a replacement for this change, we have to consider
1129	// it to be immovable.
1130	if (!C.CreateReplacement)
1131	ChangeMaxColumn = ChangeMinColumn;
1132	else if (Style.ColumnLimit == `0`)
1133	ChangeMaxColumn = INT_MAX;
1134	else if (Style.ColumnLimit >= C.TokenLength)
1135	ChangeMaxColumn = Style.ColumnLimit - C.TokenLength;
1136	else
1137	ChangeMaxColumn = ChangeMinColumn;
1138
1139	if (I + `1` < Size && Changes [I + `1`].ContinuesPPDirective &&
1140	ChangeMaxColumn >= `2`) {
1141	ChangeMaxColumn -= `2`;
1142	}
1143
1144	bool WasAlignedWithStartOfNextLine = false;
1145	if (C.NewlinesBefore >= `1`) { // A comment on its own line.
1146	const auto CommentColumn =
1147	SourceMgr.getSpellingColumnNumber(Loc: C.OriginalWhitespaceRange.getEnd());
1148	for (int J = I + `1`; J < Size; ++J) {
1149	if (Changes [J].Tok->is(Kind: tok::comment))
1150	continue;
1151
1152	const auto NextColumn = SourceMgr.getSpellingColumnNumber(
1153	Loc: Changes [J].OriginalWhitespaceRange.getEnd());
1154	// The start of the next token was previously aligned with the
1155	// start of this comment.
1156	WasAlignedWithStartOfNextLine =
1157	CommentColumn == NextColumn \|\|
1158	CommentColumn == NextColumn + Style.IndentWidth;
1159	break;
1160	}
1161	}
1162
1163	// We don't want to align comments which end a scope, which are here
1164	// identified by most closing braces.
1165	auto DontAlignThisComment = [](const auto *Tok) {
1166	if (Tok->is(tok::semi)) {
1167	Tok = Tok->getPreviousNonComment();
1168	if (!Tok)
1169	return false;
1170	}
1171	if (Tok->is(tok::r_paren)) {
1172	// Back up past the parentheses and a `TT_DoWhile` that may precede.
1173	Tok = Tok->MatchingParen;
1174	if (!Tok)
1175	return false;
1176	Tok = Tok->getPreviousNonComment();
1177	if (!Tok)
1178	return false;
1179	if (Tok->is(TT_DoWhile)) {
1180	const auto *Prev = Tok->getPreviousNonComment();
1181	if (!Prev) {
1182	// A do-while-loop without braces.
1183	return true;
1184	}
1185	Tok = Prev;
1186	}
1187	}
1188
1189	if (Tok->isNot(tok::r_brace))
1190	return false;
1191
1192	while (Tok->Previous && Tok->Previous->is(tok::r_brace))
1193	Tok = Tok->Previous;
1194	return Tok->NewlinesBefore > `0`;
1195	};
1196
1197	if (I > `0` && C.NewlinesBefore == `0` &&
1198	DontAlignThisComment (Changes [I - `1`].Tok)) {
1199	alignTrailingComments(Start: StartOfSequence, End: I, Column: MinColumn);
1200	// Reset to initial values, but skip this change for the next alignment
1201	// pass.
1202	MinColumn = `0`;
1203	MaxColumn = INT_MAX;
1204	StartOfSequence = I + `1`;
1205	} else if (BreakBeforeNext \|\| Newlines > NewLineThreshold \|\|
1206	(ChangeMinColumn > MaxColumn \|\| ChangeMaxColumn < MinColumn) \|\|
1207	// Break the comment sequence if the previous line did not end
1208	// in a trailing comment.
1209	(C.NewlinesBefore == `1` && I > `0` &&
1210	!Changes [I - `1`].IsTrailingComment) \|\|
1211	WasAlignedWithStartOfNextLine) {
1212	alignTrailingComments(Start: StartOfSequence, End: I, Column: MinColumn);
1213	MinColumn = ChangeMinColumn;
1214	MaxColumn = ChangeMaxColumn;
1215	StartOfSequence = I;
1216	} else {
1217	MinColumn = std::max(a: MinColumn, b: ChangeMinColumn);
1218	MaxColumn = std::min(a: MaxColumn, b: ChangeMaxColumn);
1219	}
1220	BreakBeforeNext = (I == `0`) \|\| (C.NewlinesBefore > `1`) \|\|
1221	// Never start a sequence with a comment at the beginning
1222	// of the line.
1223	(C.NewlinesBefore == `1` && StartOfSequence == I);
1224	Newlines = `0`;
1225	}
1226	alignTrailingComments(Start: StartOfSequence, End: Size, Column: MinColumn);
1227	}
1228
1229	void WhitespaceManager::alignTrailingComments(unsigned Start, unsigned End,
1230	unsigned Column) {
1231	for (unsigned i = Start; i != End; ++i) {
1232	int Shift = `0`;
1233	if (Changes [i].IsTrailingComment)
1234	Shift = Column - Changes [i].StartOfTokenColumn;
1235	if (Changes [i].StartOfBlockComment) {
1236	Shift = Changes [i].IndentationOffset +
1237	Changes [i].StartOfBlockComment->StartOfTokenColumn -
1238	Changes [i].StartOfTokenColumn;
1239	}
1240	if (Shift <= `0`)
1241	continue;
1242	Changes [i].Spaces += Shift;
1243	if (i + `1` != Changes.size())
1244	Changes [i + `1`].PreviousEndOfTokenColumn += Shift;
1245	Changes [i].StartOfTokenColumn += Shift;
1246	}
1247	}
1248
1249	void WhitespaceManager::alignEscapedNewlines() {
1250	const auto Align = Style.AlignEscapedNewlines;
1251	if (Align == FormatStyle::ENAS_DontAlign)
1252	return;
1253
1254	const bool WithLastLine = Align == FormatStyle::ENAS_LeftWithLastLine;
1255	const bool AlignLeft = Align == FormatStyle::ENAS_Left \|\| WithLastLine;
1256	const auto MaxColumn = Style.ColumnLimit;
1257	unsigned MaxEndOfLine = AlignLeft ? `0` : MaxColumn;
1258	unsigned StartOfMacro = `0`;
1259	for (unsigned i = `1`, e = Changes.size(); i < e; ++i) {
1260	Change &C = Changes [i];
1261	if (C.NewlinesBefore == `0` && (!WithLastLine \|\| C.Tok->isNot(Kind: tok::eof)))
1262	continue;
1263	const bool InPPDirective = C.ContinuesPPDirective;
1264	const auto BackslashColumn = C.PreviousEndOfTokenColumn + `2`;
1265	if (InPPDirective \|\|
1266	(WithLastLine && (MaxColumn == `0` \|\| BackslashColumn <= MaxColumn))) {
1267	MaxEndOfLine = std::max(a: BackslashColumn, b: MaxEndOfLine);
1268	}
1269	if (!InPPDirective) {
1270	alignEscapedNewlines(Start: StartOfMacro + `1`, End: i, Column: MaxEndOfLine);
1271	MaxEndOfLine = AlignLeft ? `0` : MaxColumn;
1272	StartOfMacro = i;
1273	}
1274	}
1275	alignEscapedNewlines(Start: StartOfMacro + `1`, End: Changes.size(), Column: MaxEndOfLine);
1276	}
1277
1278	void WhitespaceManager::alignEscapedNewlines(unsigned Start, unsigned End,
1279	unsigned Column) {
1280	for (unsigned i = Start; i < End; ++i) {
1281	Change &C = Changes [i];
1282	if (C.NewlinesBefore > `0`) {
1283	assert(C.ContinuesPPDirective);
1284	if (C.PreviousEndOfTokenColumn + `1` > Column)
1285	C.EscapedNewlineColumn = `0`;
1286	else
1287	C.EscapedNewlineColumn = Column;
1288	}
1289	}
1290	}
1291
1292	void WhitespaceManager::alignArrayInitializers() {
1293	if (Style.AlignArrayOfStructures == FormatStyle::AIAS_None)
1294	return;
1295
1296	for (unsigned ChangeIndex = `1U`, ChangeEnd = Changes.size();
1297	ChangeIndex < ChangeEnd; ++ChangeIndex) {
1298	auto &C = Changes [ChangeIndex];
1299	if (C.Tok->IsArrayInitializer) {
1300	bool FoundComplete = false;
1301	for (unsigned InsideIndex = ChangeIndex + `1`; InsideIndex < ChangeEnd;
1302	++InsideIndex) {
1303	if (Changes [InsideIndex].Tok == C.Tok->MatchingParen) {
1304	alignArrayInitializers(Start: ChangeIndex, End: InsideIndex + `1`);
1305	ChangeIndex = InsideIndex + `1`;
1306	FoundComplete = true;
1307	break;
1308	}
1309	}
1310	if (!FoundComplete)
1311	ChangeIndex = ChangeEnd;
1312	}
1313	}
1314	}
1315
1316	void WhitespaceManager::alignArrayInitializers(unsigned Start, unsigned End) {
1317
1318	if (Style.AlignArrayOfStructures == FormatStyle::AIAS_Right)
1319	alignArrayInitializersRightJustified(CellDescs: getCells(Start, End));
1320	else if (Style.AlignArrayOfStructures == FormatStyle::AIAS_Left)
1321	alignArrayInitializersLeftJustified(CellDescs: getCells(Start, End));
1322	}
1323
1324	void WhitespaceManager::alignArrayInitializersRightJustified(
1325	CellDescriptions &&CellDescs) {
1326	if (!CellDescs.isRectangular())
1327	return;
1328
1329	const int BracePadding = Style.Cpp11BracedListStyle ? `0` : `1`;
1330	auto &Cells = CellDescs.Cells;
1331	// Now go through and fixup the spaces.
1332	auto *CellIter = Cells.begin();
1333	for (auto i = `0U`; i < CellDescs.CellCounts [`0`]; ++i, ++CellIter) {
1334	unsigned NetWidth = `0U`;
1335	if (isSplitCell(Cell: *CellIter))
1336	NetWidth = getNetWidth(Start: Cells.begin(), End: CellIter, InitialSpaces: CellDescs.InitialSpaces);
1337	auto CellWidth = getMaximumCellWidth(CellIter, NetWidth);
1338
1339	if (Changes [CellIter->Index].Tok->is(Kind: tok::r_brace)) {
1340	// So in here we want to see if there is a brace that falls
1341	// on a line that was split. If so on that line we make sure that
1342	// the spaces in front of the brace are enough.
1343	const auto *Next = CellIter;
1344	do {
1345	const FormatToken *Previous = Changes [Next->Index].Tok->Previous;
1346	if (Previous && Previous->isNot(Kind: TT_LineComment)) {
1347	Changes [Next->Index].Spaces = BracePadding;
1348	Changes [Next->Index].NewlinesBefore = `0`;
1349	}
1350	Next = Next->NextColumnElement;
1351	} while (Next);
1352	// Unless the array is empty, we need the position of all the
1353	// immediately adjacent cells
1354	if (CellIter != Cells.begin()) {
1355	auto ThisNetWidth =
1356	getNetWidth(Start: Cells.begin(), End: CellIter, InitialSpaces: CellDescs.InitialSpaces);
1357	auto MaxNetWidth = getMaximumNetWidth(
1358	CellStart: Cells.begin(), CellStop: CellIter, InitialSpaces: CellDescs.InitialSpaces,
1359	CellCount: CellDescs.CellCounts [`0`], MaxRowCount: CellDescs.CellCounts.size());
1360	if (ThisNetWidth < MaxNetWidth)
1361	Changes [CellIter->Index].Spaces = (MaxNetWidth - ThisNetWidth);
1362	auto RowCount = `1U`;
1363	auto Offset = std::distance(first: Cells.begin(), last: CellIter);
1364	for (const auto *Next = CellIter->NextColumnElement; Next;
1365	Next = Next->NextColumnElement) {
1366	if (RowCount >= CellDescs.CellCounts.size())
1367	break;
1368	auto Start = (Cells.begin() + RowCount CellDescs.CellCounts [`0`]);
1369	auto *End = Start + Offset;
1370	ThisNetWidth = getNetWidth(Start, End, InitialSpaces: CellDescs.InitialSpaces);
1371	if (ThisNetWidth < MaxNetWidth)
1372	Changes [Next->Index].Spaces = (MaxNetWidth - ThisNetWidth);
1373	++RowCount;
1374	}
1375	}
1376	} else {
1377	auto ThisWidth =
1378	calculateCellWidth(Start: CellIter->Index, End: CellIter->EndIndex, WithSpaces: true) +
1379	NetWidth;
1380	if (Changes [CellIter->Index].NewlinesBefore == `0`) {
1381	Changes [CellIter->Index].Spaces = (CellWidth - (ThisWidth + NetWidth));
1382	Changes [CellIter->Index].Spaces += (i > `0`) ? `1` : BracePadding;
1383	}
1384	alignToStartOfCell(Start: CellIter->Index, End: CellIter->EndIndex);
1385	for (const auto *Next = CellIter->NextColumnElement; Next;
1386	Next = Next->NextColumnElement) {
1387	ThisWidth =
1388	calculateCellWidth(Start: Next->Index, End: Next->EndIndex, WithSpaces: true) + NetWidth;
1389	if (Changes [Next->Index].NewlinesBefore == `0`) {
1390	Changes [Next->Index].Spaces = (CellWidth - ThisWidth);
1391	Changes [Next->Index].Spaces += (i > `0`) ? `1` : BracePadding;
1392	}
1393	alignToStartOfCell(Start: Next->Index, End: Next->EndIndex);
1394	}
1395	}
1396	}
1397	}
1398
1399	void WhitespaceManager::alignArrayInitializersLeftJustified(
1400	CellDescriptions &&CellDescs) {
1401
1402	if (!CellDescs.isRectangular())
1403	return;
1404
1405	const int BracePadding = Style.Cpp11BracedListStyle ? `0` : `1`;
1406	auto &Cells = CellDescs.Cells;
1407	// Now go through and fixup the spaces.
1408	auto *CellIter = Cells.begin();
1409	// The first cell of every row needs to be against the left brace.
1410	for (const auto *Next = CellIter; Next; Next = Next->NextColumnElement) {
1411	auto &Change = Changes [Next->Index];
1412	Change.Spaces =
1413	Change.NewlinesBefore == `0` ? BracePadding : CellDescs.InitialSpaces;
1414	}
1415	++CellIter;
1416	for (auto i = `1U`; i < CellDescs.CellCounts [`0`]; i++, ++CellIter) {
1417	auto MaxNetWidth = getMaximumNetWidth(
1418	CellStart: Cells.begin(), CellStop: CellIter, InitialSpaces: CellDescs.InitialSpaces,
1419	CellCount: CellDescs.CellCounts [`0`], MaxRowCount: CellDescs.CellCounts.size());
1420	auto ThisNetWidth =
1421	getNetWidth(Start: Cells.begin(), End: CellIter, InitialSpaces: CellDescs.InitialSpaces);
1422	if (Changes [CellIter->Index].NewlinesBefore == `0`) {
1423	Changes [CellIter->Index].Spaces =
1424	MaxNetWidth - ThisNetWidth +
1425	(Changes [CellIter->Index].Tok->isNot(Kind: tok::r_brace) ? `1`
1426	: BracePadding);
1427	}
1428	auto RowCount = `1U`;
1429	auto Offset = std::distance(first: Cells.begin(), last: CellIter);
1430	for (const auto *Next = CellIter->NextColumnElement; Next;
1431	Next = Next->NextColumnElement) {
1432	if (RowCount >= CellDescs.CellCounts.size())
1433	break;
1434	auto Start = (Cells.begin() + RowCount CellDescs.CellCounts [`0`]);
1435	auto *End = Start + Offset;
1436	auto ThisNetWidth = getNetWidth(Start, End, InitialSpaces: CellDescs.InitialSpaces);
1437	if (Changes [Next->Index].NewlinesBefore == `0`) {
1438	Changes [Next->Index].Spaces =
1439	MaxNetWidth - ThisNetWidth +
1440	(Changes [Next->Index].Tok->isNot(Kind: tok::r_brace) ? `1` : BracePadding);
1441	}
1442	++RowCount;
1443	}
1444	}
1445	}
1446
1447	bool WhitespaceManager::isSplitCell(const CellDescription &Cell) {
1448	if (Cell.HasSplit)
1449	return true;
1450	for (const auto *Next = Cell.NextColumnElement; Next;
1451	Next = Next->NextColumnElement) {
1452	if (Next->HasSplit)
1453	return true;
1454	}
1455	return false;
1456	}
1457
1458	WhitespaceManager::CellDescriptions WhitespaceManager::getCells(unsigned Start,
1459	unsigned End) {
1460
1461	unsigned Depth = `0`;
1462	unsigned Cell = `0`;
1463	SmallVector<unsigned> CellCounts;
1464	unsigned InitialSpaces = `0`;
1465	unsigned InitialTokenLength = `0`;
1466	unsigned EndSpaces = `0`;
1467	SmallVector<CellDescription> Cells;
1468	const FormatToken MatchingParen = nullptr*;
1469	for (unsigned i = Start; i < End; ++i) {
1470	auto &C = Changes [i];
1471	if (C.Tok->is(Kind: tok::l_brace))
1472	++Depth;
1473	else if (C.Tok->is(Kind: tok::r_brace))
1474	--Depth;
1475	if (Depth == `2`) {
1476	if (C.Tok->is(Kind: tok::l_brace)) {
1477	Cell = `0`;
1478	MatchingParen = C.Tok->MatchingParen;
1479	if (InitialSpaces == `0`) {
1480	InitialSpaces = C.Spaces + C.TokenLength;
1481	InitialTokenLength = C.TokenLength;
1482	auto j = i - `1`;
1483	for (; Changes [j].NewlinesBefore == `0` && j > Start; --j) {
1484	InitialSpaces += Changes [j].Spaces + Changes [j].TokenLength;
1485	InitialTokenLength += Changes [j].TokenLength;
1486	}
1487	if (C.NewlinesBefore == `0`) {
1488	InitialSpaces += Changes [j].Spaces + Changes [j].TokenLength;
1489	InitialTokenLength += Changes [j].TokenLength;
1490	}
1491	}
1492	} else if (C.Tok->is(Kind: tok::comma)) {
1493	if (!Cells.empty())
1494	Cells.back().EndIndex = i;
1495	if (const auto *Next = C.Tok->getNextNonComment();
1496	Next && Next->isNot(Kind: tok::r_brace)) { // dangling comma
1497	++Cell;
1498	}
1499	}
1500	} else if (Depth == `1`) {
1501	if (C.Tok == MatchingParen) {
1502	if (!Cells.empty())
1503	Cells.back().EndIndex = i;
1504	Cells.push_back(Elt: CellDescription{.Index: i, .Cell: ++Cell, .EndIndex: i + `1`, .HasSplit: false, .NextColumnElement: nullptr});
1505	CellCounts.push_back(Elt: C.Tok->Previous->isNot(Kind: tok::comma) ? Cell + `1`
1506	: Cell);
1507	// Go to the next non-comment and ensure there is a break in front
1508	const auto *NextNonComment = C.Tok->getNextNonComment();
1509	while (NextNonComment && NextNonComment->is(Kind: tok::comma))
1510	NextNonComment = NextNonComment->getNextNonComment();
1511	auto j = i;
1512	while (j < End && Changes [j].Tok != NextNonComment)
1513	++j;
1514	if (j < End && Changes [j].NewlinesBefore == `0` &&
1515	Changes [j].Tok->isNot(Kind: tok::r_brace)) {
1516	Changes [j].NewlinesBefore = `1`;
1517	// Account for the added token lengths
1518	Changes [j].Spaces = InitialSpaces - InitialTokenLength;
1519	}
1520	} else if (C.Tok->is(Kind: tok::comment) && C.Tok->NewlinesBefore == `0`) {
1521	// Trailing comments stay at a space past the last token
1522	C.Spaces = Changes [i - `1`].Tok->is(Kind: tok::comma) ? `1` : `2`;
1523	} else if (C.Tok->is(Kind: tok::l_brace)) {
1524	// We need to make sure that the ending braces is aligned to the
1525	// start of our initializer
1526	auto j = i - `1`;
1527	for (; j > `0` && !Changes [j].Tok->ArrayInitializerLineStart; --j)
1528	; // Nothing the loop does the work
1529	EndSpaces = Changes [j].Spaces;
1530	}
1531	} else if (Depth == `0` && C.Tok->is(Kind: tok::r_brace)) {
1532	C.NewlinesBefore = `1`;
1533	C.Spaces = EndSpaces;
1534	}
1535	if (C.Tok->StartsColumn) {
1536	// This gets us past tokens that have been split over multiple
1537	// lines
1538	bool HasSplit = false;
1539	if (Changes [i].NewlinesBefore > `0`) {
1540	// So if we split a line previously and the tail line + this token is
1541	// less then the column limit we remove the split here and just put
1542	// the column start at a space past the comma
1543	//
1544	// FIXME This if branch covers the cases where the column is not
1545	// the first column. This leads to weird pathologies like the formatting
1546	// auto foo = Items{
1547	// Section{
1548	// 0, bar(),
1549	// }
1550	// };
1551	// Well if it doesn't lead to that it's indicative that the line
1552	// breaking should be revisited. Unfortunately alot of other options
1553	// interact with this
1554	auto j = i - `1`;
1555	if ((j - `1`) > Start && Changes [j].Tok->is(Kind: tok::comma) &&
1556	Changes [j - `1`].NewlinesBefore > `0`) {
1557	--j;
1558	auto LineLimit = Changes [j].Spaces + Changes [j].TokenLength;
1559	if (LineLimit < Style.ColumnLimit) {
1560	Changes [i].NewlinesBefore = `0`;
1561	Changes [i].Spaces = `1`;
1562	}
1563	}
1564	}
1565	while (Changes [i].NewlinesBefore > `0` && Changes [i].Tok == C.Tok) {
1566	Changes [i].Spaces = InitialSpaces;
1567	++i;
1568	HasSplit = true;
1569	}
1570	if (Changes [i].Tok != C.Tok)
1571	--i;
1572	Cells.push_back(Elt: CellDescription{.Index: i, .Cell: Cell, .EndIndex: i, .HasSplit: HasSplit, .NextColumnElement: nullptr});
1573	}
1574	}
1575
1576	return linkCells(CellDesc: {.Cells: Cells, .CellCounts: CellCounts, .InitialSpaces: InitialSpaces});
1577	}
1578
1579	unsigned WhitespaceManager::calculateCellWidth(unsigned Start, unsigned End,
1580	bool WithSpaces) const {
1581	unsigned CellWidth = `0`;
1582	for (auto i = Start; i < End; i++) {
1583	if (Changes [i].NewlinesBefore > `0`)
1584	CellWidth = `0`;
1585	CellWidth += Changes [i].TokenLength;
1586	CellWidth += (WithSpaces ? Changes [i].Spaces : `0`);
1587	}
1588	return CellWidth;
1589	}
1590
1591	void WhitespaceManager::alignToStartOfCell(unsigned Start, unsigned End) {
1592	if ((End - Start) <= `1`)
1593	return;
1594	// If the line is broken anywhere in there make sure everything
1595	// is aligned to the parent
1596	for (auto i = Start + `1`; i < End; i++)
1597	if (Changes [i].NewlinesBefore > `0`)
1598	Changes [i].Spaces = Changes [Start].Spaces;
1599	}
1600
1601	WhitespaceManager::CellDescriptions
1602	WhitespaceManager::linkCells(CellDescriptions &&CellDesc) {
1603	auto &Cells = CellDesc.Cells;
1604	for (auto *CellIter = Cells.begin(); CellIter != Cells.end(); ++CellIter) {
1605	if (!CellIter->NextColumnElement && (CellIter + `1`) != Cells.end()) {
1606	for (auto *NextIter = CellIter + `1`; NextIter != Cells.end(); ++NextIter) {
1607	if (NextIter->Cell == CellIter->Cell) {
1608	CellIter->NextColumnElement = &(*NextIter);
1609	break;
1610	}
1611	}
1612	}
1613	}
1614	return std::move(CellDesc);
1615	}
1616
1617	void WhitespaceManager::generateChanges() {
1618	for (unsigned i = `0`, e = Changes.size(); i != e; ++i) {
1619	const Change &C = Changes [i];
1620	if (i > `0`) {
1621	auto Last = Changes [i - `1`].OriginalWhitespaceRange;
1622	auto New = Changes [i].OriginalWhitespaceRange;
1623	// Do not generate two replacements for the same location. As a special
1624	// case, it is allowed if there is a replacement for the empty range
1625	// between 2 tokens and another non-empty range at the start of the second
1626	// token. We didn't implement logic to combine replacements for 2
1627	// consecutive source ranges into a single replacement, because the
1628	// program works fine without it.
1629	//
1630	// We can't eliminate empty original whitespace ranges. They appear when
1631	// 2 tokens have no whitespace in between in the input. It does not
1632	// matter whether whitespace is to be added. If no whitespace is to be
1633	// added, the replacement will be empty, and it gets eliminated after this
1634	// step in storeReplacement. For example, if the input is `foo();`,
1635	// there will be a replacement for the range between every consecutive
1636	// pair of tokens.
1637	//
1638	// A replacement at the start of a token can be added by
1639	// BreakableStringLiteralUsingOperators::insertBreak when it adds braces
1640	// around the string literal. Say Verilog code is being formatted and the
1641	// first line is to become the next 2 lines.
1642	// x("long string");
1643	// x({"long ",
1644	// "string"});
1645	// There will be a replacement for the empty range between the parenthesis
1646	// and the string and another replacement for the quote character. The
1647	// replacement for the empty range between the parenthesis and the quote
1648	// comes from ContinuationIndenter::addTokenOnCurrentLine when it changes
1649	// the original empty range between the parenthesis and the string to
1650	// another empty one. The replacement for the quote character comes from
1651	// BreakableStringLiteralUsingOperators::insertBreak when it adds the
1652	// brace. In the example, the replacement for the empty range is the same
1653	// as the original text. However, eliminating replacements that are same
1654	// as the original does not help in general. For example, a newline can
1655	// be inserted, causing the first line to become the next 3 lines.
1656	// xxxxxxxxxxx("long string");
1657	// xxxxxxxxxxx(
1658	// {"long ",
1659	// "string"});
1660	// In that case, the empty range between the parenthesis and the string
1661	// will be replaced by a newline and 4 spaces. So we will still have to
1662	// deal with a replacement for an empty source range followed by a
1663	// replacement for a non-empty source range.
1664	if (Last.getBegin() == New.getBegin() &&
1665	(Last.getEnd() != Last.getBegin() \|\|
1666	New.getEnd() == New.getBegin())) {
1667	continue;
1668	}
1669	}
1670	if (C.CreateReplacement) {
1671	std::string ReplacementText = C.PreviousLinePostfix;
1672	if (C.ContinuesPPDirective) {
1673	appendEscapedNewlineText(Text&: ReplacementText, Newlines: C.NewlinesBefore,
1674	PreviousEndOfTokenColumn: C.PreviousEndOfTokenColumn,
1675	EscapedNewlineColumn: C.EscapedNewlineColumn);
1676	} else {
1677	appendNewlineText(Text&: ReplacementText, Newlines: C.NewlinesBefore);
1678	}
1679	// FIXME: This assert should hold if we computed the column correctly.
1680	// assert((int)C.StartOfTokenColumn >= C.Spaces);
1681	appendIndentText(
1682	Text&: ReplacementText, IndentLevel: C.Tok->IndentLevel, Spaces: std::max(a: `0`, b: C.Spaces),
1683	WhitespaceStartColumn: std::max(a: (int)C.StartOfTokenColumn, b: C.Spaces) - std::max(a: `0`, b: C.Spaces),
1684	IsAligned: C.IsAligned);
1685	ReplacementText.append(str: C.CurrentLinePrefix);
1686	storeReplacement(Range: C.OriginalWhitespaceRange, Text: ReplacementText);
1687	}
1688	}
1689	}
1690
1691	void WhitespaceManager::storeReplacement(SourceRange Range, StringRef Text) {
1692	unsigned WhitespaceLength = SourceMgr.getFileOffset(SpellingLoc: Range.getEnd()) -
1693	SourceMgr.getFileOffset(SpellingLoc: Range.getBegin());
1694	// Don't create a replacement, if it does not change anything.
1695	if (StringRef (SourceMgr.getCharacterData(SL: Range.getBegin()),
1696	WhitespaceLength) == Text) {
1697	return;
1698	}
1699	auto Err = Replaces.add(R: tooling::Replacement (
1700	SourceMgr, CharSourceRange::getCharRange(R: Range), Text));
1701	// FIXME: better error handling. For now, just print an error message in the
1702	// release version.
1703	if (Err) {
1704	llvm::errs() << llvm::toString(E: std::move(Err)) << "\n";
1705	assert(false);
1706	}
1707	}
1708
1709	void WhitespaceManager::appendNewlineText(std::string &Text,
1710	unsigned Newlines) {
1711	if (UseCRLF) {
1712	Text.reserve(res_arg: Text.size() + `2` * Newlines);
1713	for (unsigned i = `0`; i < Newlines; ++i)
1714	Text.append(s: "\r\n");
1715	} else {
1716	Text.append(n: Newlines, c: `'\n'`);
1717	}
1718	}
1719
1720	void WhitespaceManager::appendEscapedNewlineText(
1721	std::string &Text, unsigned Newlines, unsigned PreviousEndOfTokenColumn,
1722	unsigned EscapedNewlineColumn) {
1723	if (Newlines > `0`) {
1724	unsigned Spaces =
1725	std::max<int>(a: `1`, b: EscapedNewlineColumn - PreviousEndOfTokenColumn - `1`);
1726	for (unsigned i = `0`; i < Newlines; ++i) {
1727	Text.append(n: Spaces, c: `' '`);
1728	Text.append(s: UseCRLF ? "\\\r\n" : "\\\n");
1729	Spaces = std::max<int>(a: `0`, b: EscapedNewlineColumn - `1`);
1730	}
1731	}
1732	}
1733
1734	void WhitespaceManager::appendIndentText(std::string &Text,
1735	unsigned IndentLevel, unsigned Spaces,
1736	unsigned WhitespaceStartColumn,
1737	bool IsAligned) {
1738	switch (Style.UseTab) {
1739	case FormatStyle::UT_Never:
1740	Text.append(n: Spaces, c: `' '`);
1741	break;
1742	case FormatStyle::UT_Always: {
1743	if (Style.TabWidth) {
1744	unsigned FirstTabWidth =
1745	Style.TabWidth - WhitespaceStartColumn % Style.TabWidth;
1746
1747	// Insert only spaces when we want to end up before the next tab.
1748	if (Spaces < FirstTabWidth \|\| Spaces == `1`) {
1749	Text.append(n: Spaces, c: `' '`);
1750	break;
1751	}
1752	// Align to the next tab.
1753	Spaces -= FirstTabWidth;
1754	Text.append(s: "\t");
1755
1756	Text.append(n: Spaces / Style.TabWidth, c: `'\t'`);
1757	Text.append(n: Spaces % Style.TabWidth, c: `' '`);
1758	} else if (Spaces == `1`) {
1759	Text.append(n: Spaces, c: `' '`);
1760	}
1761	break;
1762	}
1763	case FormatStyle::UT_ForIndentation:
1764	if (WhitespaceStartColumn == `0`) {
1765	unsigned Indentation = IndentLevel * Style.IndentWidth;
1766	Spaces = appendTabIndent(Text, Spaces, Indentation);
1767	}
1768	Text.append(n: Spaces, c: `' '`);
1769	break;
1770	case FormatStyle::UT_ForContinuationAndIndentation:
1771	if (WhitespaceStartColumn == `0`)
1772	Spaces = appendTabIndent(Text, Spaces, Indentation: Spaces);
1773	Text.append(n: Spaces, c: `' '`);
1774	break;
1775	case FormatStyle::UT_AlignWithSpaces:
1776	if (WhitespaceStartColumn == `0`) {
1777	unsigned Indentation =
1778	IsAligned ? IndentLevel * Style.IndentWidth : Spaces;
1779	Spaces = appendTabIndent(Text, Spaces, Indentation);
1780	}
1781	Text.append(n: Spaces, c: `' '`);
1782	break;
1783	}
1784	}
1785
1786	unsigned WhitespaceManager::appendTabIndent(std::string &Text, unsigned Spaces,
1787	unsigned Indentation) {
1788	// This happens, e.g. when a line in a block comment is indented less than the
1789	// first one.
1790	if (Indentation > Spaces)
1791	Indentation = Spaces;
1792	if (Style.TabWidth) {
1793	unsigned Tabs = Indentation / Style.TabWidth;
1794	Text.append(n: Tabs, c: `'\t'`);
1795	Spaces -= Tabs * Style.TabWidth;
1796	}
1797	return Spaces;
1798	}
1799
1800	} // namespace format
1801	} // namespace clang
1802

Browse the source code of llvm_projects/clang/lib/Format/WhitespaceManager.cpp