UnwrappedLineParser.cpp source code [llvm_projects/clang/lib/Format/UnwrappedLineParser.cpp]

1	//===--- UnwrappedLineParser.cpp - Format C++ code ------------------------===//
2	//
3	// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4	// See https://llvm.org/LICENSE.txt for license information.
5	// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6	//
7	//===----------------------------------------------------------------------===//
8	///
9	/// \file
10	/// This file contains the implementation of the UnwrappedLineParser,
11	/// which turns a stream of tokens into UnwrappedLines.
12	///
13	//===----------------------------------------------------------------------===//
14
15	#include "UnwrappedLineParser.h"
16	#include "FormatToken.h"
17	#include "FormatTokenSource.h"
18	#include "Macros.h"
19	#include "TokenAnnotator.h"
20	#include "clang/Basic/TokenKinds.h"
21	#include "llvm/ADT/STLExtras.h"
22	#include "llvm/ADT/StringRef.h"
23	#include "llvm/Support/Debug.h"
24	#include "llvm/Support/raw_os_ostream.h"
25	#include "llvm/Support/raw_ostream.h"
26
27	#include <utility>
28
29	#define DEBUG_TYPE "format-parser"
30
31	namespace clang {
32	namespace format {
33
34	namespace {
35
36	void printLine(llvm::raw_ostream &OS, const UnwrappedLine &Line,
37	StringRef Prefix = "", bool PrintText = false) {
38	OS << Prefix << "Line(" << Line.Level << ", FSC=" << Line.FirstStartColumn
39	<< ")" << (Line.InPPDirective ? " MACRO" : "") << ": ";
40	bool NewLine = false;
41	for (std::list<UnwrappedLineNode>::const_iterator I = Line.Tokens.begin(),
42	E = Line.Tokens.end();
43	I != E; ++I) {
44	if (NewLine) {
45	OS << Prefix;
46	NewLine = false;
47	}
48	OS << I ->Tok->Tok.getName() << "["
49	<< "T=" << (unsigned)I ->Tok->getType()
50	<< ", OC=" << I ->Tok->OriginalColumn << ", \"" << I ->Tok->TokenText
51	<< "\"] ";
52	for (const auto CI = I ->Children.begin(), CE = I ->Children.end();
53	CI != CE; ++CI) {
54	OS << "\n";
55	printLine(OS, Line: *CI, Prefix: (Prefix + " ").str());
56	NewLine = true;
57	}
58	}
59	if (!NewLine)
60	OS << "\n";
61	}
62
63	LLVM_ATTRIBUTE_UNUSED static void printDebugInfo(const UnwrappedLine &Line) {
64	printLine(OS&: llvm::dbgs(), Line);
65	}
66
67	class ScopedDeclarationState {
68	public:
69	ScopedDeclarationState(UnwrappedLine &Line, llvm::BitVector &Stack,
70	bool MustBeDeclaration)
71	: Line(Line), Stack(Stack) {
72	Line.MustBeDeclaration = MustBeDeclaration;
73	Stack.push_back(Val: MustBeDeclaration);
74	}
75	~ScopedDeclarationState() {
76	Stack.pop_back();
77	if (!Stack.empty())
78	Line.MustBeDeclaration = Stack.back();
79	else
80	Line.MustBeDeclaration = true;
81	}
82
83	private:
84	UnwrappedLine &Line;
85	llvm::BitVector &Stack;
86	};
87
88	} // end anonymous namespace
89
90	std::ostream &operator<<(std::ostream &Stream, const UnwrappedLine &Line) {
91	llvm::raw_os_ostream OS(Stream);
92	printLine(OS, Line);
93	return Stream;
94	}
95
96	class ScopedLineState {
97	public:
98	ScopedLineState(UnwrappedLineParser &Parser,
99	bool SwitchToPreprocessorLines = false)
100	: Parser(Parser), OriginalLines(Parser.CurrentLines) {
101	if (SwitchToPreprocessorLines)
102	Parser.CurrentLines = &Parser.PreprocessorDirectives;
103	else if (!Parser.Line ->Tokens.empty())
104	Parser.CurrentLines = &Parser.Line ->Tokens.back().Children;
105	PreBlockLine = std::move(Parser.Line);
106	Parser.Line = std::make_unique<UnwrappedLine>();
107	Parser.Line ->Level = PreBlockLine ->Level;
108	Parser.Line ->PPLevel = PreBlockLine ->PPLevel;
109	Parser.Line ->InPPDirective = PreBlockLine ->InPPDirective;
110	Parser.Line ->InMacroBody = PreBlockLine ->InMacroBody;
111	Parser.Line ->UnbracedBodyLevel = PreBlockLine ->UnbracedBodyLevel;
112	}
113
114	~ScopedLineState() {
115	if (!Parser.Line ->Tokens.empty())
116	Parser.addUnwrappedLine();
117	assert(Parser.Line->Tokens.empty());
118	Parser.Line = std::move(PreBlockLine);
119	if (Parser.CurrentLines == &Parser.PreprocessorDirectives)
120	Parser.AtEndOfPPLine = true;
121	Parser.CurrentLines = OriginalLines;
122	}
123
124	private:
125	UnwrappedLineParser &Parser;
126
127	std::unique_ptr<UnwrappedLine> PreBlockLine;
128	SmallVectorImpl<UnwrappedLine> *OriginalLines;
129	};
130
131	class CompoundStatementIndenter {
132	public:
133	CompoundStatementIndenter(UnwrappedLineParser *Parser,
134	const FormatStyle &Style, unsigned &LineLevel)
135	: CompoundStatementIndenter (Parser, LineLevel,
136	Style.BraceWrapping.AfterControlStatement ==
137	FormatStyle::BWACS_Always,
138	Style.BraceWrapping.IndentBraces) {}
139	CompoundStatementIndenter(UnwrappedLineParser Parser, unsigned* &LineLevel,
140	bool WrapBrace, bool IndentBrace)
141	: LineLevel(LineLevel), OldLineLevel(LineLevel) {
142	if (WrapBrace)
143	Parser->addUnwrappedLine();
144	if (IndentBrace)
145	++LineLevel;
146	}
147	~CompoundStatementIndenter() { LineLevel = OldLineLevel; }
148
149	private:
150	unsigned &LineLevel;
151	unsigned OldLineLevel;
152	};
153
154	UnwrappedLineParser::UnwrappedLineParser(
155	SourceManager &SourceMgr, const FormatStyle &Style,
156	const AdditionalKeywords &Keywords, unsigned FirstStartColumn,
157	ArrayRef<FormatToken *> Tokens, UnwrappedLineConsumer &Callback,
158	llvm::SpecificBumpPtrAllocator<FormatToken> &Allocator,
159	IdentifierTable &IdentTable)
160	: Line (new UnwrappedLine), AtEndOfPPLine(false), CurrentLines(&Lines),
161	Style(Style), IsCpp(Style.isCpp()),
162	LangOpts(getFormattingLangOpts(Style)), Keywords(Keywords),
163	CommentPragmasRegex (Style.CommentPragmas), Tokens(nullptr),
164	Callback(Callback), AllTokens (Tokens), PPBranchLevel(-`1`),
165	IncludeGuard(Style.IndentPPDirectives == FormatStyle::PPDIS_None
166	? IG_Rejected
167	: IG_Inited),
168	IncludeGuardToken(nullptr), FirstStartColumn(FirstStartColumn),
169	Macros (Style.Macros, SourceMgr, Style, Allocator, IdentTable) {}
170
171	void UnwrappedLineParser::reset() {
172	PPBranchLevel = -`1`;
173	IncludeGuard = Style.IndentPPDirectives == FormatStyle::PPDIS_None
174	? IG_Rejected
175	: IG_Inited;
176	IncludeGuardToken = nullptr;
177	Line.reset(p: new UnwrappedLine);
178	CommentsBeforeNextToken.clear();
179	FormatTok = nullptr;
180	AtEndOfPPLine = false;
181	IsDecltypeAutoFunction = false;
182	PreprocessorDirectives.clear();
183	CurrentLines = &Lines;
184	DeclarationScopeStack.clear();
185	NestedTooDeep.clear();
186	NestedLambdas.clear();
187	PPStack.clear();
188	Line ->FirstStartColumn = FirstStartColumn;
189
190	if (!Unexpanded.empty())
191	for (FormatToken *Token : AllTokens)
192	Token->MacroCtx.reset();
193	CurrentExpandedLines.clear();
194	ExpandedLines.clear();
195	Unexpanded.clear();
196	InExpansion = false;
197	Reconstruct.reset();
198	}
199
200	void UnwrappedLineParser::parse() {
201	IndexedTokenSource TokenSource(AllTokens);
202	Line ->FirstStartColumn = FirstStartColumn;
203	do {
204	LLVM_DEBUG(llvm::dbgs() << "----\n");
205	reset();
206	Tokens = &TokenSource;
207	TokenSource.reset();
208
209	readToken();
210	parseFile();
211
212	// If we found an include guard then all preprocessor directives (other than
213	// the guard) are over-indented by one.
214	if (IncludeGuard == IG_Found) {
215	for (auto &Line : Lines)
216	if (Line.InPPDirective && Line.Level > `0`)
217	--Line.Level;
218	}
219
220	// Create line with eof token.
221	assert(eof());
222	pushToken(Tok: FormatTok);
223	addUnwrappedLine();
224
225	// In a first run, format everything with the lines containing macro calls
226	// replaced by the expansion.
227	if (!ExpandedLines.empty()) {
228	LLVM_DEBUG(llvm::dbgs() << "Expanded lines:\n");
229	for (const auto &Line : Lines) {
230	if (!Line.Tokens.empty()) {
231	auto it = ExpandedLines.find(Val: Line.Tokens.begin()->Tok);
232	if (it != ExpandedLines.end()) {
233	for (const auto &Expanded : it ->second) {
234	LLVM_DEBUG(printDebugInfo(Expanded));
235	Callback.consumeUnwrappedLine(Line: Expanded);
236	}
237	continue;
238	}
239	}
240	LLVM_DEBUG(printDebugInfo(Line));
241	Callback.consumeUnwrappedLine(Line);
242	}
243	Callback.finishRun();
244	}
245
246	LLVM_DEBUG(llvm::dbgs() << "Unwrapped lines:\n");
247	for (const UnwrappedLine &Line : Lines) {
248	LLVM_DEBUG(printDebugInfo(Line));
249	Callback.consumeUnwrappedLine(Line);
250	}
251	Callback.finishRun();
252	Lines.clear();
253	while (!PPLevelBranchIndex.empty() &&
254	PPLevelBranchIndex.back() + `1` >= PPLevelBranchCount.back()) {
255	PPLevelBranchIndex.resize(N: PPLevelBranchIndex.size() - `1`);
256	PPLevelBranchCount.resize(N: PPLevelBranchCount.size() - `1`);
257	}
258	if (!PPLevelBranchIndex.empty()) {
259	++PPLevelBranchIndex.back();
260	assert(PPLevelBranchIndex.size() == PPLevelBranchCount.size());
261	assert(PPLevelBranchIndex.back() <= PPLevelBranchCount.back());
262	}
263	} while (!PPLevelBranchIndex.empty());
264	}
265
266	void UnwrappedLineParser::parseFile() {
267	// The top-level context in a file always has declarations, except for pre-
268	// processor directives and JavaScript files.
269	bool MustBeDeclaration = !Line ->InPPDirective && !Style.isJavaScript();
270	ScopedDeclarationState DeclarationState(*Line, DeclarationScopeStack,
271	MustBeDeclaration);
272	if (Style.isTextProto() \|\| (Style.isJson() && FormatTok->IsFirst))
273	parseBracedList();
274	else
275	parseLevel();
276	// Make sure to format the remaining tokens.
277	//
278	// LK_TextProto is special since its top-level is parsed as the body of a
279	// braced list, which does not necessarily have natural line separators such
280	// as a semicolon. Comments after the last entry that have been determined to
281	// not belong to that line, as in:
282	// key: value
283	// // endfile comment
284	// do not have a chance to be put on a line of their own until this point.
285	// Here we add this newline before end-of-file comments.
286	if (Style.isTextProto() && !CommentsBeforeNextToken.empty())
287	addUnwrappedLine();
288	flushComments(NewlineBeforeNext: true);
289	addUnwrappedLine();
290	}
291
292	void UnwrappedLineParser::parseCSharpGenericTypeConstraint() {
293	do {
294	switch (FormatTok->Tok.getKind()) {
295	case tok::l_brace:
296	case tok::semi:
297	return;
298	default:
299	if (FormatTok->is(II: Keywords.kw_where)) {
300	addUnwrappedLine();
301	nextToken();
302	parseCSharpGenericTypeConstraint();
303	break;
304	}
305	nextToken();
306	break;
307	}
308	} while (!eof());
309	}
310
311	void UnwrappedLineParser::parseCSharpAttribute() {
312	int UnpairedSquareBrackets = `1`;
313	do {
314	switch (FormatTok->Tok.getKind()) {
315	case tok::r_square:
316	nextToken();
317	--UnpairedSquareBrackets;
318	if (UnpairedSquareBrackets == `0`) {
319	addUnwrappedLine();
320	return;
321	}
322	break;
323	case tok::l_square:
324	++UnpairedSquareBrackets;
325	nextToken();
326	break;
327	default:
328	nextToken();
329	break;
330	}
331	} while (!eof());
332	}
333
334	bool UnwrappedLineParser::precededByCommentOrPPDirective() const {
335	if (!Lines.empty() && Lines.back().InPPDirective)
336	return true;
337
338	const FormatToken *Previous = Tokens->getPreviousToken();
339	return Previous && Previous->is(Kind: tok::comment) &&
340	(Previous->IsMultiline \|\| Previous->NewlinesBefore > `0`);
341	}
342
343	/// Parses a level, that is ???.
344	/// \param OpeningBrace Opening brace (\p nullptr if absent) of that level.
345	/// \param IfKind The \p if statement kind in the level.
346	/// \param IfLeftBrace The left brace of the \p if block in the level.
347	/// \returns true if a simple block of if/else/for/while, or false otherwise.
348	/// (A simple block has a single statement.)
349	bool UnwrappedLineParser::parseLevel(const FormatToken *OpeningBrace,
350	IfStmtKind *IfKind,
351	FormatToken **IfLeftBrace) {
352	const bool InRequiresExpression =
353	OpeningBrace && OpeningBrace->is(TT: TT_RequiresExpressionLBrace);
354	const bool IsPrecededByCommentOrPPDirective =
355	!Style.RemoveBracesLLVM \|\| precededByCommentOrPPDirective();
356	FormatToken IfLBrace = nullptr*;
357	bool HasDoWhile = false;
358	bool HasLabel = false;
359	unsigned StatementCount = `0`;
360	bool SwitchLabelEncountered = false;
361
362	do {
363	if (FormatTok->isAttribute()) {
364	nextToken();
365	if (FormatTok->is(Kind: tok::l_paren))
366	parseParens();
367	continue;
368	}
369	tok::TokenKind Kind = FormatTok->Tok.getKind();
370	if (FormatTok->is(TT: TT_MacroBlockBegin))
371	Kind = tok::l_brace;
372	else if (FormatTok->is(TT: TT_MacroBlockEnd))
373	Kind = tok::r_brace;
374
375	auto ParseDefault = [this, OpeningBrace, IfKind, &IfLBrace, &HasDoWhile,
376	&HasLabel, &StatementCount] {
377	parseStructuralElement(OpeningBrace, IfKind, IfLeftBrace: &IfLBrace,
378	HasDoWhile: HasDoWhile ? nullptr : &HasDoWhile,
379	HasLabel: HasLabel ? nullptr : &HasLabel);
380	++StatementCount;
381	assert(StatementCount > `0` && "StatementCount overflow!");
382	};
383
384	switch (Kind) {
385	case tok::comment:
386	nextToken();
387	addUnwrappedLine();
388	break;
389	case tok::l_brace:
390	if (InRequiresExpression) {
391	FormatTok->setFinalizedType(TT_CompoundRequirementLBrace);
392	} else if (FormatTok->Previous &&
393	FormatTok->Previous->ClosesRequiresClause) {
394	// We need the 'default' case here to correctly parse a function
395	// l_brace.
396	ParseDefault ();
397	continue;
398	}
399	if (!InRequiresExpression && FormatTok->isNot(Kind: TT_MacroBlockBegin)) {
400	if (tryToParseBracedList())
401	continue;
402	FormatTok->setFinalizedType(TT_BlockLBrace);
403	}
404	parseBlock();
405	++StatementCount;
406	assert(StatementCount > `0` && "StatementCount overflow!");
407	addUnwrappedLine();
408	break;
409	case tok::r_brace:
410	if (OpeningBrace) {
411	if (!Style.RemoveBracesLLVM \|\| Line ->InPPDirective \|\|
412	!OpeningBrace->isOneOf(K1: TT_ControlStatementLBrace, K2: TT_ElseLBrace)) {
413	return false;
414	}
415	if (FormatTok->isNot(Kind: tok::r_brace) \|\| StatementCount != `1` \|\| HasLabel \|\|
416	HasDoWhile \|\| IsPrecededByCommentOrPPDirective \|\|
417	precededByCommentOrPPDirective()) {
418	return false;
419	}
420	const FormatToken *Next = Tokens->peekNextToken();
421	if (Next->is(Kind: tok::comment) && Next->NewlinesBefore == `0`)
422	return false;
423	if (IfLeftBrace)
424	*IfLeftBrace = IfLBrace;
425	return true;
426	}
427	nextToken();
428	addUnwrappedLine();
429	break;
430	case tok::kw_default: {
431	unsigned StoredPosition = Tokens->getPosition();
432	auto *Next = Tokens->getNextNonComment();
433	FormatTok = Tokens->setPosition(StoredPosition);
434	if (!Next->isOneOf(K1: tok::colon, K2: tok::arrow)) {
435	// default not followed by `:` or `->` is not a case label; treat it
436	// like an identifier.
437	parseStructuralElement();
438	break;
439	}
440	// Else, if it is 'default:', fall through to the case handling.
441	[[fallthrough]];
442	}
443	case tok::kw_case:
444	if (Style.Language == FormatStyle::LK_Proto \|\| Style.isVerilog() \|\|
445	(Style.isJavaScript() && Line ->MustBeDeclaration)) {
446	// Proto: there are no switch/case statements
447	// Verilog: Case labels don't have this word. We handle case
448	// labels including default in TokenAnnotator.
449	// JavaScript: A 'case: string' style field declaration.
450	ParseDefault ();
451	break;
452	}
453	if (!SwitchLabelEncountered &&
454	(Style.IndentCaseLabels \|\|
455	(OpeningBrace && OpeningBrace->is(TT: TT_SwitchExpressionLBrace)) \|\|
456	(Line ->InPPDirective && Line ->Level == `1`))) {
457	++Line ->Level;
458	}
459	SwitchLabelEncountered = true;
460	parseStructuralElement();
461	break;
462	case tok::l_square:
463	if (Style.isCSharp()) {
464	nextToken();
465	parseCSharpAttribute();
466	break;
467	}
468	if (handleCppAttributes())
469	break;
470	[[fallthrough]];
471	default:
472	ParseDefault ();
473	break;
474	}
475	} while (!eof());
476
477	return false;
478	}
479
480	void UnwrappedLineParser::calculateBraceTypes(bool ExpectClassBody) {
481	// We'll parse forward through the tokens until we hit
482	// a closing brace or eof - note that getNextToken() will
483	// parse macros, so this will magically work inside macro
484	// definitions, too.
485	unsigned StoredPosition = Tokens->getPosition();
486	FormatToken *Tok = FormatTok;
487	const FormatToken *PrevTok = Tok->Previous;
488	// Keep a stack of positions of lbrace tokens. We will
489	// update information about whether an lbrace starts a
490	// braced init list or a different block during the loop.
491	struct StackEntry {
492	FormatToken *Tok;
493	const FormatToken *PrevTok;
494	};
495	SmallVector<StackEntry, `8`> LBraceStack;
496	assert(Tok->is(tok::l_brace));
497
498	do {
499	auto *NextTok = Tokens->getNextNonComment();
500
501	if (!Line ->InMacroBody && !Style.isTableGen()) {
502	// Skip PPDirective lines (except macro definitions) and comments.
503	while (NextTok->is(Kind: tok::hash)) {
504	NextTok = Tokens->getNextToken();
505	if (NextTok->isOneOf(K1: tok::pp_not_keyword, K2: tok::pp_define))
506	break;
507	do {
508	NextTok = Tokens->getNextToken();
509	} while (!NextTok->HasUnescapedNewline && NextTok->isNot(Kind: tok::eof));
510
511	while (NextTok->is(Kind: tok::comment))
512	NextTok = Tokens->getNextToken();
513	}
514	}
515
516	switch (Tok->Tok.getKind()) {
517	case tok::l_brace:
518	if (Style.isJavaScript() && PrevTok) {
519	if (PrevTok->isOneOf(K1: tok::colon, K2: tok::less)) {
520	// A ':' indicates this code is in a type, or a braced list
521	// following a label in an object literal ({a: {b: 1}}).
522	// A '<' could be an object used in a comparison, but that is nonsense
523	// code (can never return true), so more likely it is a generic type
524	// argument (`X<{a: string; b: number}>`).
525	// The code below could be confused by semicolons between the
526	// individual members in a type member list, which would normally
527	// trigger BK_Block. In both cases, this must be parsed as an inline
528	// braced init.
529	Tok->setBlockKind(BK_BracedInit);
530	} else if (PrevTok->is(Kind: tok::r_paren)) {
531	// `) { }` can only occur in function or method declarations in JS.
532	Tok->setBlockKind(BK_Block);
533	}
534	} else {
535	Tok->setBlockKind(BK_Unknown);
536	}
537	LBraceStack.push_back(Elt: {.Tok: Tok, .PrevTok: PrevTok});
538	break;
539	case tok::r_brace:
540	if (LBraceStack.empty())
541	break;
542	if (auto *LBrace = LBraceStack.back().Tok; LBrace->is(BBK: BK_Unknown)) {
543	bool ProbablyBracedList = false;
544	if (Style.Language == FormatStyle::LK_Proto) {
545	ProbablyBracedList = NextTok->isOneOf(K1: tok::comma, K2: tok::r_square);
546	} else if (LBrace->isNot(Kind: TT_EnumLBrace)) {
547	// Using OriginalColumn to distinguish between ObjC methods and
548	// binary operators is a bit hacky.
549	bool NextIsObjCMethod = NextTok->isOneOf(K1: tok::plus, K2: tok::minus) &&
550	NextTok->OriginalColumn == `0`;
551
552	// Try to detect a braced list. Note that regardless how we mark inner
553	// braces here, we will overwrite the BlockKind later if we parse a
554	// braced list (where all blocks inside are by default braced lists),
555	// or when we explicitly detect blocks (for example while parsing
556	// lambdas).
557
558	// If we already marked the opening brace as braced list, the closing
559	// must also be part of it.
560	ProbablyBracedList = LBrace->is(TT: TT_BracedListLBrace);
561
562	ProbablyBracedList = ProbablyBracedList \|\|
563	(Style.isJavaScript() &&
564	NextTok->isOneOf(K1: Keywords.kw_of, K2: Keywords.kw_in,
565	Ks: Keywords.kw_as));
566	ProbablyBracedList =
567	ProbablyBracedList \|\|
568	(IsCpp && (PrevTok->Tok.isLiteral() \|\|
569	NextTok->isOneOf(K1: tok::l_paren, K2: tok::arrow)));
570
571	// If there is a comma, semicolon or right paren after the closing
572	// brace, we assume this is a braced initializer list.
573	// FIXME: Some of these do not apply to JS, e.g. "} {" can never be a
574	// braced list in JS.
575	ProbablyBracedList =
576	ProbablyBracedList \|\|
577	NextTok->isOneOf(K1: tok::comma, K2: tok::period, Ks: tok::colon,
578	Ks: tok::r_paren, Ks: tok::r_square, Ks: tok::ellipsis);
579
580	// Distinguish between braced list in a constructor initializer list
581	// followed by constructor body, or just adjacent blocks.
582	ProbablyBracedList =
583	ProbablyBracedList \|\|
584	(NextTok->is(Kind: tok::l_brace) && LBraceStack.back().PrevTok &&
585	LBraceStack.back().PrevTok->isOneOf(K1: tok::identifier,
586	K2: tok::greater));
587
588	ProbablyBracedList =
589	ProbablyBracedList \|\|
590	(NextTok->is(Kind: tok::identifier) &&
591	!PrevTok->isOneOf(K1: tok::semi, K2: tok::r_brace, Ks: tok::l_brace));
592
593	ProbablyBracedList = ProbablyBracedList \|\|
594	(NextTok->is(Kind: tok::semi) &&
595	(!ExpectClassBody \|\| LBraceStack.size() != `1`));
596
597	ProbablyBracedList =
598	ProbablyBracedList \|\|
599	(NextTok->isBinaryOperator() && !NextIsObjCMethod);
600
601	if (!Style.isCSharp() && NextTok->is(Kind: tok::l_square)) {
602	// We can have an array subscript after a braced init
603	// list, but C++11 attributes are expected after blocks.
604	NextTok = Tokens->getNextToken();
605	ProbablyBracedList = NextTok->isNot(Kind: tok::l_square);
606	}
607
608	// Cpp macro definition body that is a nonempty braced list or block:
609	if (IsCpp && Line ->InMacroBody && PrevTok != FormatTok &&
610	!FormatTok->Previous && NextTok->is(Kind: tok::eof) &&
611	// A statement can end with only `;` (simple statement), a block
612	// closing brace (compound statement), or `:` (label statement).
613	// If PrevTok is a block opening brace, Tok ends an empty block.
614	!PrevTok->isOneOf(K1: tok::semi, K2: BK_Block, Ks: tok::colon)) {
615	ProbablyBracedList = true;
616	}
617	}
618	const auto BlockKind = ProbablyBracedList ? BK_BracedInit : BK_Block;
619	Tok->setBlockKind(BlockKind);
620	LBrace->setBlockKind(BlockKind);
621	}
622	LBraceStack.pop_back();
623	break;
624	case tok::identifier:
625	if (Tok->isNot(Kind: TT_StatementMacro))
626	break;
627	[[fallthrough]];
628	case tok::at:
629	case tok::semi:
630	case tok::kw_if:
631	case tok::kw_while:
632	case tok::kw_for:
633	case tok::kw_switch:
634	case tok::kw_try:
635	case tok::kw___try:
636	if (!LBraceStack.empty() && LBraceStack.back().Tok->is(BBK: BK_Unknown))
637	LBraceStack.back().Tok->setBlockKind(BK_Block);
638	break;
639	default:
640	break;
641	}
642
643	PrevTok = Tok;
644	Tok = NextTok;
645	} while (Tok->isNot(Kind: tok::eof) && !LBraceStack.empty());
646
647	// Assume other blocks for all unclosed opening braces.
648	for (const auto &Entry : LBraceStack)
649	if (Entry.Tok->is(BBK: BK_Unknown))
650	Entry.Tok->setBlockKind(BK_Block);
651
652	FormatTok = Tokens->setPosition(StoredPosition);
653	}
654
655	// Sets the token type of the directly previous right brace.
656	void UnwrappedLineParser::setPreviousRBraceType(TokenType Type) {
657	if (auto Prev = FormatTok->getPreviousNonComment();
658	Prev && Prev->is(Kind: tok::r_brace)) {
659	Prev->setFinalizedType(Type);
660	}
661	}
662
663	template <class T>
664	static inline void hash_combine(std::size_t &seed, const T &v) {
665	std::hash<T> hasher;
666	seed ^= hasher(v) + `0x9e3779b9` + (seed << `6`) + (seed >> `2`);
667	}
668
669	size_t UnwrappedLineParser::computePPHash() const {
670	size_t h = `0`;
671	for (const auto &i : PPStack) {
672	hash_combine(seed&: h, v: size_t(i.Kind));
673	hash_combine(seed&: h, v: i.Line);
674	}
675	return h;
676	}
677
678	// Checks whether \p ParsedLine might fit on a single line. If \p OpeningBrace
679	// is not null, subtracts its length (plus the preceding space) when computing
680	// the length of \p ParsedLine. We must clone the tokens of \p ParsedLine before
681	// running the token annotator on it so that we can restore them afterward.
682	bool UnwrappedLineParser::mightFitOnOneLine(
683	UnwrappedLine &ParsedLine, const FormatToken OpeningBrace) const* {
684	const auto ColumnLimit = Style.ColumnLimit;
685	if (ColumnLimit == `0`)
686	return true;
687
688	auto &Tokens = ParsedLine.Tokens;
689	assert(!Tokens.empty());
690
691	const auto *LastToken = Tokens.back().Tok;
692	assert(LastToken);
693
694	SmallVector<UnwrappedLineNode> SavedTokens(Tokens.size());
695
696	int Index = `0`;
697	for (const auto &Token : Tokens) {
698	assert(Token.Tok);
699	auto &SavedToken = SavedTokens [Index++];
700	SavedToken.Tok = new FormatToken;
701	SavedToken.Tok->copyFrom(Tok: *Token.Tok);
702	SavedToken.Children = std::move(Token.Children);
703	}
704
705	AnnotatedLine Line(ParsedLine);
706	assert(Line.Last == LastToken);
707
708	TokenAnnotator Annotator(Style, Keywords);
709	Annotator.annotate(Line);
710	Annotator.calculateFormattingInformation(Line);
711
712	auto Length = LastToken->TotalLength;
713	if (OpeningBrace) {
714	assert(OpeningBrace != Tokens.front().Tok);
715	if (auto Prev = OpeningBrace->Previous;
716	Prev && Prev->TotalLength + ColumnLimit == OpeningBrace->TotalLength) {
717	Length -= ColumnLimit;
718	}
719	Length -= OpeningBrace->TokenText.size() + `1`;
720	}
721
722	if (const auto *FirstToken = Line.First; FirstToken->is(Kind: tok::r_brace)) {
723	assert(!OpeningBrace \|\| OpeningBrace->is(TT_ControlStatementLBrace));
724	Length -= FirstToken->TokenText.size() + `1`;
725	}
726
727	Index = `0`;
728	for (auto &Token : Tokens) {
729	const auto &SavedToken = SavedTokens [Index++];
730	Token.Tok->copyFrom(Tok: *SavedToken.Tok);
731	Token.Children = std::move(SavedToken.Children);
732	delete SavedToken.Tok;
733	}
734
735	// If these change PPLevel needs to be used for get correct indentation.
736	assert(!Line.InMacroBody);
737	assert(!Line.InPPDirective);
738	return Line.Level * Style.IndentWidth + Length <= ColumnLimit;
739	}
740
741	FormatToken UnwrappedLineParser::parseBlock(bool* MustBeDeclaration,
742	unsigned AddLevels, bool MunchSemi,
743	bool KeepBraces,
744	IfStmtKind *IfKind,
745	bool UnindentWhitesmithsBraces) {
746	auto HandleVerilogBlockLabel = [this]() {
747	// ":" name
748	if (Style.isVerilog() && FormatTok->is(Kind: tok::colon)) {
749	nextToken();
750	if (Keywords.isVerilogIdentifier(Tok: *FormatTok))
751	nextToken();
752	}
753	};
754
755	// Whether this is a Verilog-specific block that has a special header like a
756	// module.
757	const bool VerilogHierarchy =
758	Style.isVerilog() && Keywords.isVerilogHierarchy(Tok: *FormatTok);
759	assert((FormatTok->isOneOf(tok::l_brace, TT_MacroBlockBegin) \|\|
760	(Style.isVerilog() &&
761	(Keywords.isVerilogBegin(*FormatTok) \|\| VerilogHierarchy))) &&
762	"'{' or macro block token expected");
763	FormatToken *Tok = FormatTok;
764	const bool FollowedByComment = Tokens->peekNextToken()->is(Kind: tok::comment);
765	auto Index = CurrentLines->size();
766	const bool MacroBlock = FormatTok->is(TT: TT_MacroBlockBegin);
767	FormatTok->setBlockKind(BK_Block);
768
769	// For Whitesmiths mode, jump to the next level prior to skipping over the
770	// braces.
771	if (!VerilogHierarchy && AddLevels > `0` &&
772	Style.BreakBeforeBraces == FormatStyle::BS_Whitesmiths) {
773	++Line ->Level;
774	}
775
776	size_t PPStartHash = computePPHash();
777
778	const unsigned InitialLevel = Line ->Level;
779	if (VerilogHierarchy) {
780	AddLevels += parseVerilogHierarchyHeader();
781	} else {
782	nextToken(/LevelDifference=/AddLevels);
783	HandleVerilogBlockLabel ();
784	}
785
786	// Bail out if there are too many levels. Otherwise, the stack might overflow.
787	if (Line ->Level > `300`)
788	return nullptr;
789
790	if (MacroBlock && FormatTok->is(Kind: tok::l_paren))
791	parseParens();
792
793	size_t NbPreprocessorDirectives =
794	!parsingPPDirective() ? PreprocessorDirectives.size() : `0`;
795	addUnwrappedLine();
796	size_t OpeningLineIndex =
797	CurrentLines->empty()
798	? (UnwrappedLine::kInvalidIndex)
799	: (CurrentLines->size() - `1` - NbPreprocessorDirectives);
800
801	// Whitesmiths is weird here. The brace needs to be indented for the namespace
802	// block, but the block itself may not be indented depending on the style
803	// settings. This allows the format to back up one level in those cases.
804	if (UnindentWhitesmithsBraces)
805	--Line ->Level;
806
807	ScopedDeclarationState DeclarationState(*Line, DeclarationScopeStack,
808	MustBeDeclaration);
809	if (AddLevels > `0u` && Style.BreakBeforeBraces != FormatStyle::BS_Whitesmiths)
810	Line ->Level += AddLevels;
811
812	FormatToken IfLBrace = nullptr*;
813	const bool SimpleBlock = parseLevel(OpeningBrace: Tok, IfKind, IfLeftBrace: &IfLBrace);
814
815	if (eof())
816	return IfLBrace;
817
818	if (MacroBlock ? FormatTok->isNot(Kind: TT_MacroBlockEnd)
819	: FormatTok->isNot(Kind: tok::r_brace)) {
820	Line ->Level = InitialLevel;
821	FormatTok->setBlockKind(BK_Block);
822	return IfLBrace;
823	}
824
825	if (FormatTok->is(Kind: tok::r_brace)) {
826	FormatTok->setBlockKind(BK_Block);
827	if (Tok->is(TT: TT_NamespaceLBrace))
828	FormatTok->setFinalizedType(TT_NamespaceRBrace);
829	}
830
831	const bool IsFunctionRBrace =
832	FormatTok->is(Kind: tok::r_brace) && Tok->is(TT: TT_FunctionLBrace);
833
834	auto RemoveBraces = [=]() mutable {
835	if (!SimpleBlock)
836	return false;
837	assert(Tok->isOneOf(TT_ControlStatementLBrace, TT_ElseLBrace));
838	assert(FormatTok->is(tok::r_brace));
839	const bool WrappedOpeningBrace = !Tok->Previous;
840	if (WrappedOpeningBrace && FollowedByComment)
841	return false;
842	const bool HasRequiredIfBraces = IfLBrace && !IfLBrace->Optional;
843	if (KeepBraces && !HasRequiredIfBraces)
844	return false;
845	if (Tok->isNot(Kind: TT_ElseLBrace) \|\| !HasRequiredIfBraces) {
846	const FormatToken *Previous = Tokens->getPreviousToken();
847	assert(Previous);
848	if (Previous->is(Kind: tok::r_brace) && !Previous->Optional)
849	return false;
850	}
851	assert(!CurrentLines->empty());
852	auto &LastLine = CurrentLines->back();
853	if (LastLine.Level == InitialLevel + `1` && !mightFitOnOneLine(ParsedLine&: LastLine))
854	return false;
855	if (Tok->is(TT: TT_ElseLBrace))
856	return true;
857	if (WrappedOpeningBrace) {
858	assert(Index > `0`);
859	--Index; // The line above the wrapped l_brace.
860	Tok = nullptr;
861	}
862	return mightFitOnOneLine(ParsedLine&: (*CurrentLines)[Index], OpeningBrace: Tok);
863	};
864	if (RemoveBraces ()) {
865	Tok->MatchingParen = FormatTok;
866	FormatTok->MatchingParen = Tok;
867	}
868
869	size_t PPEndHash = computePPHash();
870
871	// Munch the closing brace.
872	nextToken(/LevelDifference=/-AddLevels);
873
874	// When this is a function block and there is an unnecessary semicolon
875	// afterwards then mark it as optional (so the RemoveSemi pass can get rid of
876	// it later).
877	if (Style.RemoveSemicolon && IsFunctionRBrace) {
878	while (FormatTok->is(Kind: tok::semi)) {
879	FormatTok->Optional = true;
880	nextToken();
881	}
882	}
883
884	HandleVerilogBlockLabel ();
885
886	if (MacroBlock && FormatTok->is(Kind: tok::l_paren))
887	parseParens();
888
889	Line ->Level = InitialLevel;
890
891	if (FormatTok->is(Kind: tok::kw_noexcept)) {
892	// A noexcept in a requires expression.
893	nextToken();
894	}
895
896	if (FormatTok->is(Kind: tok::arrow)) {
897	// Following the } or noexcept we can find a trailing return type arrow
898	// as part of an implicit conversion constraint.
899	nextToken();
900	parseStructuralElement();
901	}
902
903	if (MunchSemi && FormatTok->is(Kind: tok::semi))
904	nextToken();
905
906	if (PPStartHash == PPEndHash) {
907	Line ->MatchingOpeningBlockLineIndex = OpeningLineIndex;
908	if (OpeningLineIndex != UnwrappedLine::kInvalidIndex) {
909	// Update the opening line to add the forward reference as well
910	(*CurrentLines)[OpeningLineIndex].MatchingClosingBlockLineIndex =
911	CurrentLines->size() - `1`;
912	}
913	}
914
915	return IfLBrace;
916	}
917
918	static bool isGoogScope(const UnwrappedLine &Line) {
919	// FIXME: Closure-library specific stuff should not be hard-coded but be
920	// configurable.
921	if (Line.Tokens.size() < `4`)
922	return false;
923	auto I = Line.Tokens.begin();
924	if (I ->Tok->TokenText != "goog")
925	return false;
926	++I;
927	if (I ->Tok->isNot(Kind: tok::period))
928	return false;
929	++I;
930	if (I ->Tok->TokenText != "scope")
931	return false;
932	++I;
933	return I ->Tok->is(Kind: tok::l_paren);
934	}
935
936	static bool isIIFE(const UnwrappedLine &Line,
937	const AdditionalKeywords &Keywords) {
938	// Look for the start of an immediately invoked anonymous function.
939	// https://en.wikipedia.org/wiki/Immediately-invoked_function_expression
940	// This is commonly done in JavaScript to create a new, anonymous scope.
941	// Example: (function() { ... })()
942	if (Line.Tokens.size() < `3`)
943	return false;
944	auto I = Line.Tokens.begin();
945	if (I ->Tok->isNot(Kind: tok::l_paren))
946	return false;
947	++I;
948	if (I ->Tok->isNot(Kind: Keywords.kw_function))
949	return false;
950	++I;
951	return I ->Tok->is(Kind: tok::l_paren);
952	}
953
954	static bool ShouldBreakBeforeBrace(const FormatStyle &Style,
955	const FormatToken &InitialToken) {
956	tok::TokenKind Kind = InitialToken.Tok.getKind();
957	if (InitialToken.is(TT: TT_NamespaceMacro))
958	Kind = tok::kw_namespace;
959
960	switch (Kind) {
961	case tok::kw_namespace:
962	return Style.BraceWrapping.AfterNamespace;
963	case tok::kw_class:
964	return Style.BraceWrapping.AfterClass;
965	case tok::kw_union:
966	return Style.BraceWrapping.AfterUnion;
967	case tok::kw_struct:
968	return Style.BraceWrapping.AfterStruct;
969	case tok::kw_enum:
970	return Style.BraceWrapping.AfterEnum;
971	default:
972	return false;
973	}
974	}
975
976	void UnwrappedLineParser::parseChildBlock() {
977	assert(FormatTok->is(tok::l_brace));
978	FormatTok->setBlockKind(BK_Block);
979	const FormatToken *OpeningBrace = FormatTok;
980	nextToken();
981	{
982	bool SkipIndent = (Style.isJavaScript() &&
983	(isGoogScope(Line: Line) \|\| isIIFE(Line: Line, Keywords)));
984	ScopedLineState LineState(*this);
985	ScopedDeclarationState DeclarationState(*Line, DeclarationScopeStack,
986	/MustBeDeclaration=/false);
987	Line ->Level += SkipIndent ? `0` : `1`;
988	parseLevel(OpeningBrace);
989	flushComments(NewlineBeforeNext: isOnNewLine(FormatTok: *FormatTok));
990	Line ->Level -= SkipIndent ? `0` : `1`;
991	}
992	nextToken();
993	}
994
995	void UnwrappedLineParser::parsePPDirective() {
996	assert(FormatTok->is(tok::hash) && "'#' expected");
997	ScopedMacroState MacroState(*Line, Tokens, FormatTok);
998
999	nextToken();
1000
1001	if (!FormatTok->Tok.getIdentifierInfo()) {
1002	parsePPUnknown();
1003	return;
1004	}
1005
1006	switch (FormatTok->Tok.getIdentifierInfo()->getPPKeywordID()) {
1007	case tok::pp_define:
1008	parsePPDefine();
1009	return;
1010	case tok::pp_if:
1011	parsePPIf(/IfDef=/false);
1012	break;
1013	case tok::pp_ifdef:
1014	case tok::pp_ifndef:
1015	parsePPIf(/IfDef=/true);
1016	break;
1017	case tok::pp_else:
1018	case tok::pp_elifdef:
1019	case tok::pp_elifndef:
1020	case tok::pp_elif:
1021	parsePPElse();
1022	break;
1023	case tok::pp_endif:
1024	parsePPEndIf();
1025	break;
1026	case tok::pp_pragma:
1027	parsePPPragma();
1028	break;
1029	case tok::pp_error:
1030	case tok::pp_warning:
1031	nextToken();
1032	if (!eof() && Style.isCpp())
1033	FormatTok->setFinalizedType(TT_AfterPPDirective);
1034	[[fallthrough]];
1035	default:
1036	parsePPUnknown();
1037	break;
1038	}
1039	}
1040
1041	void UnwrappedLineParser::conditionalCompilationCondition(bool Unreachable) {
1042	size_t Line = CurrentLines->size();
1043	if (CurrentLines == &PreprocessorDirectives)
1044	Line += Lines.size();
1045
1046	if (Unreachable \|\|
1047	(!PPStack.empty() && PPStack.back().Kind == PP_Unreachable)) {
1048	PPStack.push_back(Elt: {PP_Unreachable, Line});
1049	} else {
1050	PPStack.push_back(Elt: {PP_Conditional, Line});
1051	}
1052	}
1053
1054	void UnwrappedLineParser::conditionalCompilationStart(bool Unreachable) {
1055	++PPBranchLevel;
1056	assert(PPBranchLevel >= `0` && PPBranchLevel <= (int)PPLevelBranchIndex.size());
1057	if (PPBranchLevel == (int)PPLevelBranchIndex.size()) {
1058	PPLevelBranchIndex.push_back(Elt: `0`);
1059	PPLevelBranchCount.push_back(Elt: `0`);
1060	}
1061	PPChainBranchIndex.push(x: Unreachable ? -`1` : `0`);
1062	bool Skip = PPLevelBranchIndex [PPBranchLevel] > `0`;
1063	conditionalCompilationCondition(Unreachable: Unreachable \|\| Skip);
1064	}
1065
1066	void UnwrappedLineParser::conditionalCompilationAlternative() {
1067	if (!PPStack.empty())
1068	PPStack.pop_back();
1069	assert(PPBranchLevel < (int)PPLevelBranchIndex.size());
1070	if (!PPChainBranchIndex.empty())
1071	++PPChainBranchIndex.top();
1072	conditionalCompilationCondition(
1073	Unreachable: PPBranchLevel >= `0` && !PPChainBranchIndex.empty() &&
1074	PPLevelBranchIndex [PPBranchLevel] != PPChainBranchIndex.top());
1075	}
1076
1077	void UnwrappedLineParser::conditionalCompilationEnd() {
1078	assert(PPBranchLevel < (int)PPLevelBranchIndex.size());
1079	if (PPBranchLevel >= `0` && !PPChainBranchIndex.empty()) {
1080	if (PPChainBranchIndex.top() + `1` > PPLevelBranchCount [PPBranchLevel])
1081	PPLevelBranchCount [PPBranchLevel] = PPChainBranchIndex.top() + `1`;
1082	}
1083	// Guard against #endif's without #if.
1084	if (PPBranchLevel > -`1`)
1085	--PPBranchLevel;
1086	if (!PPChainBranchIndex.empty())
1087	PPChainBranchIndex.pop();
1088	if (!PPStack.empty())
1089	PPStack.pop_back();
1090	}
1091
1092	void UnwrappedLineParser::parsePPIf(bool IfDef) {
1093	bool IfNDef = FormatTok->is(Kind: tok::pp_ifndef);
1094	nextToken();
1095	bool Unreachable = false;
1096	if (!IfDef && (FormatTok->is(Kind: tok::kw_false) \|\| FormatTok->TokenText == "0"))
1097	Unreachable = true;
1098	if (IfDef && !IfNDef && FormatTok->TokenText == "SWIG")
1099	Unreachable = true;
1100	conditionalCompilationStart(Unreachable);
1101	FormatToken *IfCondition = FormatTok;
1102	// If there's a #ifndef on the first line, and the only lines before it are
1103	// comments, it could be an include guard.
1104	bool MaybeIncludeGuard = IfNDef;
1105	if (IncludeGuard == IG_Inited && MaybeIncludeGuard) {
1106	for (auto &Line : Lines) {
1107	if (Line.Tokens.front().Tok->isNot(Kind: tok::comment)) {
1108	MaybeIncludeGuard = false;
1109	IncludeGuard = IG_Rejected;
1110	break;
1111	}
1112	}
1113	}
1114	--PPBranchLevel;
1115	parsePPUnknown();
1116	++PPBranchLevel;
1117	if (IncludeGuard == IG_Inited && MaybeIncludeGuard) {
1118	IncludeGuard = IG_IfNdefed;
1119	IncludeGuardToken = IfCondition;
1120	}
1121	}
1122
1123	void UnwrappedLineParser::parsePPElse() {
1124	// If a potential include guard has an #else, it's not an include guard.
1125	if (IncludeGuard == IG_Defined && PPBranchLevel == `0`)
1126	IncludeGuard = IG_Rejected;
1127	// Don't crash when there is an #else without an #if.
1128	assert(PPBranchLevel >= -`1`);
1129	if (PPBranchLevel == -`1`)
1130	conditionalCompilationStart(/Unreachable=/true);
1131	conditionalCompilationAlternative();
1132	--PPBranchLevel;
1133	parsePPUnknown();
1134	++PPBranchLevel;
1135	}
1136
1137	void UnwrappedLineParser::parsePPEndIf() {
1138	conditionalCompilationEnd();
1139	parsePPUnknown();
1140	// If the #endif of a potential include guard is the last thing in the file,
1141	// then we found an include guard.
1142	if (IncludeGuard == IG_Defined && PPBranchLevel == -`1` && Tokens->isEOF() &&
1143	Style.IndentPPDirectives != FormatStyle::PPDIS_None) {
1144	IncludeGuard = IG_Found;
1145	}
1146	}
1147
1148	void UnwrappedLineParser::parsePPDefine() {
1149	nextToken();
1150
1151	if (!FormatTok->Tok.getIdentifierInfo()) {
1152	IncludeGuard = IG_Rejected;
1153	IncludeGuardToken = nullptr;
1154	parsePPUnknown();
1155	return;
1156	}
1157
1158	bool MaybeIncludeGuard = false;
1159	if (IncludeGuard == IG_IfNdefed &&
1160	IncludeGuardToken->TokenText == FormatTok->TokenText) {
1161	IncludeGuard = IG_Defined;
1162	IncludeGuardToken = nullptr;
1163	for (auto &Line : Lines) {
1164	if (!Line.Tokens.front().Tok->isOneOf(K1: tok::comment, K2: tok::hash)) {
1165	IncludeGuard = IG_Rejected;
1166	break;
1167	}
1168	}
1169	MaybeIncludeGuard = IncludeGuard == IG_Defined;
1170	}
1171
1172	// In the context of a define, even keywords should be treated as normal
1173	// identifiers. Setting the kind to identifier is not enough, because we need
1174	// to treat additional keywords like __except as well, which are already
1175	// identifiers. Setting the identifier info to null interferes with include
1176	// guard processing above, and changes preprocessing nesting.
1177	FormatTok->Tok.setKind(tok::identifier);
1178	FormatTok->Tok.setIdentifierInfo(Keywords.kw_internal_ident_after_define);
1179	nextToken();
1180
1181	// IncludeGuard can't have a non-empty macro definition.
1182	if (MaybeIncludeGuard && !eof())
1183	IncludeGuard = IG_Rejected;
1184
1185	if (FormatTok->Tok.getKind() == tok::l_paren &&
1186	!FormatTok->hasWhitespaceBefore()) {
1187	parseParens();
1188	}
1189	if (Style.IndentPPDirectives != FormatStyle::PPDIS_None)
1190	Line ->Level += PPBranchLevel + `1`;
1191	addUnwrappedLine();
1192	++Line ->Level;
1193
1194	Line ->PPLevel = PPBranchLevel + (IncludeGuard == IG_Defined ? `0` : `1`);
1195	assert((int)Line->PPLevel >= `0`);
1196	Line ->InMacroBody = true;
1197
1198	if (Style.SkipMacroDefinitionBody) {
1199	while (!eof()) {
1200	FormatTok->Finalized = true;
1201	FormatTok = Tokens->getNextToken();
1202	}
1203	addUnwrappedLine();
1204	return;
1205	}
1206
1207	// Errors during a preprocessor directive can only affect the layout of the
1208	// preprocessor directive, and thus we ignore them. An alternative approach
1209	// would be to use the same approach we use on the file level (no
1210	// re-indentation if there was a structural error) within the macro
1211	// definition.
1212	parseFile();
1213	}
1214
1215	void UnwrappedLineParser::parsePPPragma() {
1216	Line ->InPragmaDirective = true;
1217	parsePPUnknown();
1218	}
1219
1220	void UnwrappedLineParser::parsePPUnknown() {
1221	while (!eof())
1222	nextToken();
1223	if (Style.IndentPPDirectives != FormatStyle::PPDIS_None)
1224	Line ->Level += PPBranchLevel + `1`;
1225	addUnwrappedLine();
1226	}
1227
1228	// Here we exclude certain tokens that are not usually the first token in an
1229	// unwrapped line. This is used in attempt to distinguish macro calls without
1230	// trailing semicolons from other constructs split to several lines.
1231	static bool tokenCanStartNewLine(const FormatToken &Tok) {
1232	// Semicolon can be a null-statement, l_square can be a start of a macro or
1233	// a C++11 attribute, but this doesn't seem to be common.
1234	return !Tok.isOneOf(K1: tok::semi, K2: tok::l_brace,
1235	// Tokens that can only be used as binary operators and a
1236	// part of overloaded operator names.
1237	Ks: tok::period, Ks: tok::periodstar, Ks: tok::arrow, Ks: tok::arrowstar,
1238	Ks: tok::less, Ks: tok::greater, Ks: tok::slash, Ks: tok::percent,
1239	Ks: tok::lessless, Ks: tok::greatergreater, Ks: tok::equal,
1240	Ks: tok::plusequal, Ks: tok::minusequal, Ks: tok::starequal,
1241	Ks: tok::slashequal, Ks: tok::percentequal, Ks: tok::ampequal,
1242	Ks: tok::pipeequal, Ks: tok::caretequal, Ks: tok::greatergreaterequal,
1243	Ks: tok::lesslessequal,
1244	// Colon is used in labels, base class lists, initializer
1245	// lists, range-based for loops, ternary operator, but
1246	// should never be the first token in an unwrapped line.
1247	Ks: tok::colon,
1248	// 'noexcept' is a trailing annotation.
1249	Ks: tok::kw_noexcept);
1250	}
1251
1252	static bool mustBeJSIdent(const AdditionalKeywords &Keywords,
1253	const FormatToken *FormatTok) {
1254	// FIXME: This returns true for C/C++ keywords like 'struct'.
1255	return FormatTok->is(Kind: tok::identifier) &&
1256	(!FormatTok->Tok.getIdentifierInfo() \|\|
1257	!FormatTok->isOneOf(
1258	K1: Keywords.kw_in, K2: Keywords.kw_of, Ks: Keywords.kw_as, Ks: Keywords.kw_async,
1259	Ks: Keywords.kw_await, Ks: Keywords.kw_yield, Ks: Keywords.kw_finally,
1260	Ks: Keywords.kw_function, Ks: Keywords.kw_import, Ks: Keywords.kw_is,
1261	Ks: Keywords.kw_let, Ks: Keywords.kw_var, Ks: tok::kw_const,
1262	Ks: Keywords.kw_abstract, Ks: Keywords.kw_extends, Ks: Keywords.kw_implements,
1263	Ks: Keywords.kw_instanceof, Ks: Keywords.kw_interface,
1264	Ks: Keywords.kw_override, Ks: Keywords.kw_throws, Ks: Keywords.kw_from));
1265	}
1266
1267	static bool mustBeJSIdentOrValue(const AdditionalKeywords &Keywords,
1268	const FormatToken *FormatTok) {
1269	return FormatTok->Tok.isLiteral() \|\|
1270	FormatTok->isOneOf(K1: tok::kw_true, K2: tok::kw_false) \|\|
1271	mustBeJSIdent(Keywords, FormatTok);
1272	}
1273
1274	// isJSDeclOrStmt returns true if \|FormatTok\| starts a declaration or statement
1275	// when encountered after a value (see mustBeJSIdentOrValue).
1276	static bool isJSDeclOrStmt(const AdditionalKeywords &Keywords,
1277	const FormatToken *FormatTok) {
1278	return FormatTok->isOneOf(
1279	K1: tok::kw_return, K2: Keywords.kw_yield,
1280	// conditionals
1281	Ks: tok::kw_if, Ks: tok::kw_else,
1282	// loops
1283	Ks: tok::kw_for, Ks: tok::kw_while, Ks: tok::kw_do, Ks: tok::kw_continue, Ks: tok::kw_break,
1284	// switch/case
1285	Ks: tok::kw_switch, Ks: tok::kw_case,
1286	// exceptions
1287	Ks: tok::kw_throw, Ks: tok::kw_try, Ks: tok::kw_catch, Ks: Keywords.kw_finally,
1288	// declaration
1289	Ks: tok::kw_const, Ks: tok::kw_class, Ks: Keywords.kw_var, Ks: Keywords.kw_let,
1290	Ks: Keywords.kw_async, Ks: Keywords.kw_function,
1291	// import/export
1292	Ks: Keywords.kw_import, Ks: tok::kw_export);
1293	}
1294
1295	// Checks whether a token is a type in K&R C (aka C78).
1296	static bool isC78Type(const FormatToken &Tok) {
1297	return Tok.isOneOf(K1: tok::kw_char, K2: tok::kw_short, Ks: tok::kw_int, Ks: tok::kw_long,
1298	Ks: tok::kw_unsigned, Ks: tok::kw_float, Ks: tok::kw_double,
1299	Ks: tok::identifier);
1300	}
1301
1302	// This function checks whether a token starts the first parameter declaration
1303	// in a K&R C (aka C78) function definition, e.g.:
1304	// int f(a, b)
1305	// short a, b;
1306	// {
1307	// return a + b;
1308	// }
1309	static bool isC78ParameterDecl(const FormatToken Tok, const* FormatToken *Next,
1310	const FormatToken *FuncName) {
1311	assert(Tok);
1312	assert(Next);
1313	assert(FuncName);
1314
1315	if (FuncName->isNot(Kind: tok::identifier))
1316	return false;
1317
1318	const FormatToken *Prev = FuncName->Previous;
1319	if (!Prev \|\| (Prev->isNot(Kind: tok::star) && !isC78Type(Tok: *Prev)))
1320	return false;
1321
1322	if (!isC78Type(Tok: *Tok) &&
1323	!Tok->isOneOf(K1: tok::kw_register, K2: tok::kw_struct, Ks: tok::kw_union)) {
1324	return false;
1325	}
1326
1327	if (Next->isNot(Kind: tok::star) && !Next->Tok.getIdentifierInfo())
1328	return false;
1329
1330	Tok = Tok->Previous;
1331	if (!Tok \|\| Tok->isNot(Kind: tok::r_paren))
1332	return false;
1333
1334	Tok = Tok->Previous;
1335	if (!Tok \|\| Tok->isNot(Kind: tok::identifier))
1336	return false;
1337
1338	return Tok->Previous && Tok->Previous->isOneOf(K1: tok::l_paren, K2: tok::comma);
1339	}
1340
1341	bool UnwrappedLineParser::parseModuleImport() {
1342	assert(FormatTok->is(Keywords.kw_import) && "'import' expected");
1343
1344	if (auto Token = Tokens->peekNextToken(/SkipComment=/true);
1345	!Token->Tok.getIdentifierInfo() &&
1346	!Token->isOneOf(K1: tok::colon, K2: tok::less, Ks: tok::string_literal)) {
1347	return false;
1348	}
1349
1350	nextToken();
1351	while (!eof()) {
1352	if (FormatTok->is(Kind: tok::colon)) {
1353	FormatTok->setFinalizedType(TT_ModulePartitionColon);
1354	}
1355	// Handle import <foo/bar.h> as we would an include statement.
1356	else if (FormatTok->is(Kind: tok::less)) {
1357	nextToken();
1358	while (!FormatTok->isOneOf(K1: tok::semi, K2: tok::greater) && !eof()) {
1359	// Mark tokens up to the trailing line comments as implicit string
1360	// literals.
1361	if (FormatTok->isNot(Kind: tok::comment) &&
1362	!FormatTok->TokenText.starts_with(Prefix: "//")) {
1363	FormatTok->setFinalizedType(TT_ImplicitStringLiteral);
1364	}
1365	nextToken();
1366	}
1367	}
1368	if (FormatTok->is(Kind: tok::semi)) {
1369	nextToken();
1370	break;
1371	}
1372	nextToken();
1373	}
1374
1375	addUnwrappedLine();
1376	return true;
1377	}
1378
1379	// readTokenWithJavaScriptASI reads the next token and terminates the current
1380	// line if JavaScript Automatic Semicolon Insertion must
1381	// happen between the current token and the next token.
1382	//
1383	// This method is conservative - it cannot cover all edge cases of JavaScript,
1384	// but only aims to correctly handle certain well known cases. It must not
1385	// return true in speculative cases.
1386	void UnwrappedLineParser::readTokenWithJavaScriptASI() {
1387	FormatToken *Previous = FormatTok;
1388	readToken();
1389	FormatToken *Next = FormatTok;
1390
1391	bool IsOnSameLine =
1392	CommentsBeforeNextToken.empty()
1393	? Next->NewlinesBefore == `0`
1394	: CommentsBeforeNextToken.front()->NewlinesBefore == `0`;
1395	if (IsOnSameLine)
1396	return;
1397
1398	bool PreviousMustBeValue = mustBeJSIdentOrValue(Keywords, FormatTok: Previous);
1399	bool PreviousStartsTemplateExpr =
1400	Previous->is(TT: TT_TemplateString) && Previous->TokenText.ends_with(Suffix: "${");
1401	if (PreviousMustBeValue \|\| Previous->is(Kind: tok::r_paren)) {
1402	// If the line contains an '@' sign, the previous token might be an
1403	// annotation, which can precede another identifier/value.
1404	bool HasAt = llvm::any_of(Range&: Line ->Tokens, P: [](UnwrappedLineNode &LineNode) {
1405	return LineNode.Tok->is(Kind: tok::at);
1406	});
1407	if (HasAt)
1408	return;
1409	}
1410	if (Next->is(Kind: tok::exclaim) && PreviousMustBeValue)
1411	return addUnwrappedLine();
1412	bool NextMustBeValue = mustBeJSIdentOrValue(Keywords, FormatTok: Next);
1413	bool NextEndsTemplateExpr =
1414	Next->is(TT: TT_TemplateString) && Next->TokenText.starts_with(Prefix: "}");
1415	if (NextMustBeValue && !NextEndsTemplateExpr && !PreviousStartsTemplateExpr &&
1416	(PreviousMustBeValue \|\|
1417	Previous->isOneOf(K1: tok::r_square, K2: tok::r_paren, Ks: tok::plusplus,
1418	Ks: tok::minusminus))) {
1419	return addUnwrappedLine();
1420	}
1421	if ((PreviousMustBeValue \|\| Previous->is(Kind: tok::r_paren)) &&
1422	isJSDeclOrStmt(Keywords, FormatTok: Next)) {
1423	return addUnwrappedLine();
1424	}
1425	}
1426
1427	void UnwrappedLineParser::parseStructuralElement(
1428	const FormatToken OpeningBrace, IfStmtKind IfKind,
1429	FormatToken *IfLeftBrace, bool* HasDoWhile, bool* *HasLabel) {
1430	if (Style.isTableGen() && FormatTok->is(Kind: tok::pp_include)) {
1431	nextToken();
1432	if (FormatTok->is(Kind: tok::string_literal))
1433	nextToken();
1434	addUnwrappedLine();
1435	return;
1436	}
1437
1438	if (IsCpp) {
1439	while (FormatTok->is(Kind: tok::l_square) && handleCppAttributes()) {
1440	}
1441	} else if (Style.isVerilog()) {
1442	if (Keywords.isVerilogStructuredProcedure(Tok: *FormatTok)) {
1443	parseForOrWhileLoop(/HasParens=/false);
1444	return;
1445	}
1446	if (FormatTok->isOneOf(K1: Keywords.kw_foreach, K2: Keywords.kw_repeat)) {
1447	parseForOrWhileLoop();
1448	return;
1449	}
1450	if (FormatTok->isOneOf(K1: tok::kw_restrict, K2: Keywords.kw_assert,
1451	Ks: Keywords.kw_assume, Ks: Keywords.kw_cover)) {
1452	parseIfThenElse(IfKind, /KeepBraces=/false, /IsVerilogAssert=/true);
1453	return;
1454	}
1455
1456	// Skip things that can exist before keywords like 'if' and 'case'.
1457	while (true) {
1458	if (FormatTok->isOneOf(K1: Keywords.kw_priority, K2: Keywords.kw_unique,
1459	Ks: Keywords.kw_unique0)) {
1460	nextToken();
1461	} else if (FormatTok->is(Kind: tok::l_paren) &&
1462	Tokens->peekNextToken()->is(Kind: tok::star)) {
1463	parseParens();
1464	} else {
1465	break;
1466	}
1467	}
1468	}
1469
1470	// Tokens that only make sense at the beginning of a line.
1471	if (FormatTok->isAccessSpecifierKeyword()) {
1472	if (Style.isJava() \|\| Style.isJavaScript() \|\| Style.isCSharp())
1473	nextToken();
1474	else
1475	parseAccessSpecifier();
1476	return;
1477	}
1478	switch (FormatTok->Tok.getKind()) {
1479	case tok::kw_asm:
1480	nextToken();
1481	if (FormatTok->is(Kind: tok::l_brace)) {
1482	FormatTok->setFinalizedType(TT_InlineASMBrace);
1483	nextToken();
1484	while (FormatTok && !eof()) {
1485	if (FormatTok->is(Kind: tok::r_brace)) {
1486	FormatTok->setFinalizedType(TT_InlineASMBrace);
1487	nextToken();
1488	addUnwrappedLine();
1489	break;
1490	}
1491	FormatTok->Finalized = true;
1492	nextToken();
1493	}
1494	}
1495	break;
1496	case tok::kw_namespace:
1497	parseNamespace();
1498	return;
1499	case tok::kw_if: {
1500	if (Style.isJavaScript() && Line ->MustBeDeclaration) {
1501	// field/method declaration.
1502	break;
1503	}
1504	FormatToken *Tok = parseIfThenElse(IfKind);
1505	if (IfLeftBrace)
1506	*IfLeftBrace = Tok;
1507	return;
1508	}
1509	case tok::kw_for:
1510	case tok::kw_while:
1511	if (Style.isJavaScript() && Line ->MustBeDeclaration) {
1512	// field/method declaration.
1513	break;
1514	}
1515	parseForOrWhileLoop();
1516	return;
1517	case tok::kw_do:
1518	if (Style.isJavaScript() && Line ->MustBeDeclaration) {
1519	// field/method declaration.
1520	break;
1521	}
1522	parseDoWhile();
1523	if (HasDoWhile)
1524	HasDoWhile = true*;
1525	return;
1526	case tok::kw_switch:
1527	if (Style.isJavaScript() && Line ->MustBeDeclaration) {
1528	// 'switch: string' field declaration.
1529	break;
1530	}
1531	parseSwitch(/IsExpr=/false);
1532	return;
1533	case tok::kw_default: {
1534	// In Verilog default along with other labels are handled in the next loop.
1535	if (Style.isVerilog())
1536	break;
1537	if (Style.isJavaScript() && Line ->MustBeDeclaration) {
1538	// 'default: string' field declaration.
1539	break;
1540	}
1541	auto *Default = FormatTok;
1542	nextToken();
1543	if (FormatTok->is(Kind: tok::colon)) {
1544	FormatTok->setFinalizedType(TT_CaseLabelColon);
1545	parseLabel();
1546	return;
1547	}
1548	if (FormatTok->is(Kind: tok::arrow)) {
1549	FormatTok->setFinalizedType(TT_CaseLabelArrow);
1550	Default->setFinalizedType(TT_SwitchExpressionLabel);
1551	parseLabel();
1552	return;
1553	}
1554	// e.g. "default void f() {}" in a Java interface.
1555	break;
1556	}
1557	case tok::kw_case:
1558	// Proto: there are no switch/case statements.
1559	if (Style.Language == FormatStyle::LK_Proto) {
1560	nextToken();
1561	return;
1562	}
1563	if (Style.isVerilog()) {
1564	parseBlock();
1565	addUnwrappedLine();
1566	return;
1567	}
1568	if (Style.isJavaScript() && Line ->MustBeDeclaration) {
1569	// 'case: string' field declaration.
1570	nextToken();
1571	break;
1572	}
1573	parseCaseLabel();
1574	return;
1575	case tok::kw_goto:
1576	nextToken();
1577	if (FormatTok->is(Kind: tok::kw_case))
1578	nextToken();
1579	break;
1580	case tok::kw_try:
1581	case tok::kw___try:
1582	if (Style.isJavaScript() && Line ->MustBeDeclaration) {
1583	// field/method declaration.
1584	break;
1585	}
1586	parseTryCatch();
1587	return;
1588	case tok::kw_extern:
1589	nextToken();
1590	if (Style.isVerilog()) {
1591	// In Verilog and extern module declaration looks like a start of module.
1592	// But there is no body and endmodule. So we handle it separately.
1593	if (Keywords.isVerilogHierarchy(Tok: *FormatTok)) {
1594	parseVerilogHierarchyHeader();
1595	return;
1596	}
1597	} else if (FormatTok->is(Kind: tok::string_literal)) {
1598	nextToken();
1599	if (FormatTok->is(Kind: tok::l_brace)) {
1600	if (Style.BraceWrapping.AfterExternBlock)
1601	addUnwrappedLine();
1602	// Either we indent or for backwards compatibility we follow the
1603	// AfterExternBlock style.
1604	unsigned AddLevels =
1605	(Style.IndentExternBlock == FormatStyle::IEBS_Indent) \|\|
1606	(Style.BraceWrapping.AfterExternBlock &&
1607	Style.IndentExternBlock ==
1608	FormatStyle::IEBS_AfterExternBlock)
1609	? `1u`
1610	: `0u`;
1611	parseBlock(/MustBeDeclaration=/true, AddLevels);
1612	addUnwrappedLine();
1613	return;
1614	}
1615	}
1616	break;
1617	case tok::kw_export:
1618	if (Style.isJavaScript()) {
1619	parseJavaScriptEs6ImportExport();
1620	return;
1621	}
1622	if (IsCpp) {
1623	nextToken();
1624	if (FormatTok->is(Kind: tok::kw_namespace)) {
1625	parseNamespace();
1626	return;
1627	}
1628	if (FormatTok->is(Kind: tok::l_brace)) {
1629	parseCppExportBlock();
1630	return;
1631	}
1632	if (FormatTok->is(II: Keywords.kw_import) && parseModuleImport())
1633	return;
1634	}
1635	break;
1636	case tok::kw_inline:
1637	nextToken();
1638	if (FormatTok->is(Kind: tok::kw_namespace)) {
1639	parseNamespace();
1640	return;
1641	}
1642	break;
1643	case tok::identifier:
1644	if (FormatTok->is(TT: TT_ForEachMacro)) {
1645	parseForOrWhileLoop();
1646	return;
1647	}
1648	if (FormatTok->is(TT: TT_MacroBlockBegin)) {
1649	parseBlock(/MustBeDeclaration=/false, /AddLevels=/`1u`,
1650	/MunchSemi=/false);
1651	return;
1652	}
1653	if (FormatTok->is(II: Keywords.kw_import)) {
1654	if (Style.isJavaScript()) {
1655	parseJavaScriptEs6ImportExport();
1656	return;
1657	}
1658	if (Style.Language == FormatStyle::LK_Proto) {
1659	nextToken();
1660	if (FormatTok->is(Kind: tok::kw_public))
1661	nextToken();
1662	if (FormatTok->isNot(Kind: tok::string_literal))
1663	return;
1664	nextToken();
1665	if (FormatTok->is(Kind: tok::semi))
1666	nextToken();
1667	addUnwrappedLine();
1668	return;
1669	}
1670	if (IsCpp && parseModuleImport())
1671	return;
1672	}
1673	if (IsCpp && FormatTok->isOneOf(K1: Keywords.kw_signals, K2: Keywords.kw_qsignals,
1674	Ks: Keywords.kw_slots, Ks: Keywords.kw_qslots)) {
1675	nextToken();
1676	if (FormatTok->is(Kind: tok::colon)) {
1677	nextToken();
1678	addUnwrappedLine();
1679	return;
1680	}
1681	}
1682	if (IsCpp && FormatTok->is(TT: TT_StatementMacro)) {
1683	parseStatementMacro();
1684	return;
1685	}
1686	if (IsCpp && FormatTok->is(TT: TT_NamespaceMacro)) {
1687	parseNamespace();
1688	return;
1689	}
1690	// In Verilog labels can be any expression, so we don't do them here.
1691	// JS doesn't have macros, and within classes colons indicate fields, not
1692	// labels.
1693	// TableGen doesn't have labels.
1694	if (!Style.isJavaScript() && !Style.isVerilog() && !Style.isTableGen() &&
1695	Tokens->peekNextToken()->is(Kind: tok::colon) && !Line ->MustBeDeclaration) {
1696	nextToken();
1697	if (!Line ->InMacroBody \|\| CurrentLines->size() > `1`)
1698	Line ->Tokens.begin()->Tok->MustBreakBefore = true;
1699	FormatTok->setFinalizedType(TT_GotoLabelColon);
1700	parseLabel(LeftAlignLabel: !Style.IndentGotoLabels);
1701	if (HasLabel)
1702	HasLabel = true*;
1703	return;
1704	}
1705	if (Style.isJava() && FormatTok->is(II: Keywords.kw_record)) {
1706	parseRecord(/ParseAsExpr=/false, /IsJavaRecord=/true);
1707	addUnwrappedLine();
1708	return;
1709	}
1710	// In all other cases, parse the declaration.
1711	break;
1712	default:
1713	break;
1714	}
1715
1716	bool SeenEqual = false;
1717	for (const bool InRequiresExpression =
1718	OpeningBrace && OpeningBrace->isOneOf(K1: TT_RequiresExpressionLBrace,
1719	K2: TT_CompoundRequirementLBrace);
1720	!eof();) {
1721	const FormatToken *Previous = FormatTok->Previous;
1722	switch (FormatTok->Tok.getKind()) {
1723	case tok::at:
1724	nextToken();
1725	if (FormatTok->is(Kind: tok::l_brace)) {
1726	nextToken();
1727	parseBracedList();
1728	break;
1729	}
1730	if (Style.isJava() && FormatTok->is(II: Keywords.kw_interface)) {
1731	nextToken();
1732	break;
1733	}
1734	switch (bool IsAutoRelease = false; FormatTok->Tok.getObjCKeywordID()) {
1735	case tok::objc_public:
1736	case tok::objc_protected:
1737	case tok::objc_package:
1738	case tok::objc_private:
1739	return parseAccessSpecifier();
1740	case tok::objc_interface:
1741	case tok::objc_implementation:
1742	return parseObjCInterfaceOrImplementation();
1743	case tok::objc_protocol:
1744	if (parseObjCProtocol())
1745	return;
1746	break;
1747	case tok::objc_end:
1748	return; // Handled by the caller.
1749	case tok::objc_optional:
1750	case tok::objc_required:
1751	nextToken();
1752	addUnwrappedLine();
1753	return;
1754	case tok::objc_autoreleasepool:
1755	IsAutoRelease = true;
1756	[[fallthrough]];
1757	case tok::objc_synchronized:
1758	nextToken();
1759	if (!IsAutoRelease && FormatTok->is(Kind: tok::l_paren)) {
1760	// Skip synchronization object
1761	parseParens();
1762	}
1763	if (FormatTok->is(Kind: tok::l_brace)) {
1764	if (Style.BraceWrapping.AfterControlStatement ==
1765	FormatStyle::BWACS_Always) {
1766	addUnwrappedLine();
1767	}
1768	parseBlock();
1769	}
1770	addUnwrappedLine();
1771	return;
1772	case tok::objc_try:
1773	// This branch isn't strictly necessary (the kw_try case below would
1774	// do this too after the tok::at is parsed above). But be explicit.
1775	parseTryCatch();
1776	return;
1777	default:
1778	break;
1779	}
1780	break;
1781	case tok::kw_requires: {
1782	if (IsCpp) {
1783	bool ParsedClause = parseRequires(SeenEqual);
1784	if (ParsedClause)
1785	return;
1786	} else {
1787	nextToken();
1788	}
1789	break;
1790	}
1791	case tok::kw_enum:
1792	// Ignore if this is part of "template <enum ..." or "... -> enum" or
1793	// "template <..., enum ...>".
1794	if (Previous && Previous->isOneOf(K1: tok::less, K2: tok::arrow, Ks: tok::comma)) {
1795	nextToken();
1796	break;
1797	}
1798
1799	// parseEnum falls through and does not yet add an unwrapped line as an
1800	// enum definition can start a structural element.
1801	if (!parseEnum())
1802	break;
1803	// This only applies to C++ and Verilog.
1804	if (!IsCpp && !Style.isVerilog()) {
1805	addUnwrappedLine();
1806	return;
1807	}
1808	break;
1809	case tok::kw_typedef:
1810	nextToken();
1811	if (FormatTok->isOneOf(K1: Keywords.kw_NS_ENUM, K2: Keywords.kw_NS_OPTIONS,
1812	Ks: Keywords.kw_CF_ENUM, Ks: Keywords.kw_CF_OPTIONS,
1813	Ks: Keywords.kw_CF_CLOSED_ENUM,
1814	Ks: Keywords.kw_NS_CLOSED_ENUM)) {
1815	parseEnum();
1816	}
1817	break;
1818	case tok::kw_class:
1819	if (Style.isVerilog()) {
1820	parseBlock();
1821	addUnwrappedLine();
1822	return;
1823	}
1824	if (Style.isTableGen()) {
1825	// Do nothing special. In this case the l_brace becomes FunctionLBrace.
1826	// This is same as def and so on.
1827	nextToken();
1828	break;
1829	}
1830	[[fallthrough]];
1831	case tok::kw_struct:
1832	case tok::kw_union:
1833	if (parseStructLike())
1834	return;
1835	break;
1836	case tok::kw_decltype:
1837	nextToken();
1838	if (FormatTok->is(Kind: tok::l_paren)) {
1839	parseParens();
1840	if (FormatTok->Previous &&
1841	FormatTok->Previous->endsSequence(K1: tok::r_paren, Tokens: tok::kw_auto,
1842	Tokens: tok::l_paren)) {
1843	Line ->SeenDecltypeAuto = true;
1844	}
1845	}
1846	break;
1847	case tok::period:
1848	nextToken();
1849	// In Java, classes have an implicit static member "class".
1850	if (Style.isJava() && FormatTok && FormatTok->is(Kind: tok::kw_class))
1851	nextToken();
1852	if (Style.isJavaScript() && FormatTok &&
1853	FormatTok->Tok.getIdentifierInfo()) {
1854	// JavaScript only has pseudo keywords, all keywords are allowed to
1855	// appear in "IdentifierName" positions. See http://es5.github.io/#x7.6
1856	nextToken();
1857	}
1858	break;
1859	case tok::semi:
1860	nextToken();
1861	addUnwrappedLine();
1862	return;
1863	case tok::r_brace:
1864	addUnwrappedLine();
1865	return;
1866	case tok::l_paren: {
1867	parseParens();
1868	// Break the unwrapped line if a K&R C function definition has a parameter
1869	// declaration.
1870	if (OpeningBrace \|\| !IsCpp \|\| !Previous \|\| eof())
1871	break;
1872	if (isC78ParameterDecl(Tok: FormatTok,
1873	Next: Tokens->peekNextToken(/SkipComment=/true),
1874	FuncName: Previous)) {
1875	addUnwrappedLine();
1876	return;
1877	}
1878	break;
1879	}
1880	case tok::kw_operator:
1881	nextToken();
1882	if (FormatTok->isBinaryOperator())
1883	nextToken();
1884	break;
1885	case tok::caret: {
1886	const auto *Prev = FormatTok->getPreviousNonComment();
1887	nextToken();
1888	if (Prev && Prev->is(Kind: tok::identifier))
1889	break;
1890	// Block return type.
1891	if (FormatTok->Tok.isAnyIdentifier() \|\| FormatTok->isTypeName(LangOpts)) {
1892	nextToken();
1893	// Return types: pointers are ok too.
1894	while (FormatTok->is(Kind: tok::star))
1895	nextToken();
1896	}
1897	// Block argument list.
1898	if (FormatTok->is(Kind: tok::l_paren))
1899	parseParens();
1900	// Block body.
1901	if (FormatTok->is(Kind: tok::l_brace))
1902	parseChildBlock();
1903	break;
1904	}
1905	case tok::l_brace:
1906	if (InRequiresExpression)
1907	FormatTok->setFinalizedType(TT_BracedListLBrace);
1908	if (!tryToParsePropertyAccessor() && !tryToParseBracedList()) {
1909	IsDecltypeAutoFunction = Line ->SeenDecltypeAuto;
1910	// A block outside of parentheses must be the last part of a
1911	// structural element.
1912	// FIXME: Figure out cases where this is not true, and add projections
1913	// for them (the one we know is missing are lambdas).
1914	if (Style.isJava() &&
1915	Line ->Tokens.front().Tok->is(II: Keywords.kw_synchronized)) {
1916	// If necessary, we could set the type to something different than
1917	// TT_FunctionLBrace.
1918	if (Style.BraceWrapping.AfterControlStatement ==
1919	FormatStyle::BWACS_Always) {
1920	addUnwrappedLine();
1921	}
1922	} else if (Style.BraceWrapping.AfterFunction) {
1923	addUnwrappedLine();
1924	}
1925	if (!Previous \|\| Previous->isNot(Kind: TT_TypeDeclarationParen))
1926	FormatTok->setFinalizedType(TT_FunctionLBrace);
1927	parseBlock();
1928	IsDecltypeAutoFunction = false;
1929	addUnwrappedLine();
1930	return;
1931	}
1932	// Otherwise this was a braced init list, and the structural
1933	// element continues.
1934	break;
1935	case tok::kw_try:
1936	if (Style.isJavaScript() && Line ->MustBeDeclaration) {
1937	// field/method declaration.
1938	nextToken();
1939	break;
1940	}
1941	// We arrive here when parsing function-try blocks.
1942	if (Style.BraceWrapping.AfterFunction)
1943	addUnwrappedLine();
1944	parseTryCatch();
1945	return;
1946	case tok::identifier: {
1947	if (Style.isCSharp() && FormatTok->is(II: Keywords.kw_where) &&
1948	Line ->MustBeDeclaration) {
1949	addUnwrappedLine();
1950	parseCSharpGenericTypeConstraint();
1951	break;
1952	}
1953	if (FormatTok->is(TT: TT_MacroBlockEnd)) {
1954	addUnwrappedLine();
1955	return;
1956	}
1957
1958	// Function declarations (as opposed to function expressions) are parsed
1959	// on their own unwrapped line by continuing this loop. Function
1960	// expressions (functions that are not on their own line) must not create
1961	// a new unwrapped line, so they are special cased below.
1962	size_t TokenCount = Line ->Tokens.size();
1963	if (Style.isJavaScript() && FormatTok->is(II: Keywords.kw_function) &&
1964	(TokenCount > `1` \|\|
1965	(TokenCount == `1` &&
1966	Line ->Tokens.front().Tok->isNot(Kind: Keywords.kw_async)))) {
1967	tryToParseJSFunction();
1968	break;
1969	}
1970	if ((Style.isJavaScript() \|\| Style.isJava()) &&
1971	FormatTok->is(II: Keywords.kw_interface)) {
1972	if (Style.isJavaScript()) {
1973	// In JavaScript/TypeScript, "interface" can be used as a standalone
1974	// identifier, e.g. in `var interface = 1;`. If "interface" is
1975	// followed by another identifier, it is very like to be an actual
1976	// interface declaration.
1977	unsigned StoredPosition = Tokens->getPosition();
1978	FormatToken *Next = Tokens->getNextToken();
1979	FormatTok = Tokens->setPosition(StoredPosition);
1980	if (!mustBeJSIdent(Keywords, FormatTok: Next)) {
1981	nextToken();
1982	break;
1983	}
1984	}
1985	parseRecord();
1986	addUnwrappedLine();
1987	return;
1988	}
1989
1990	if (Style.isVerilog()) {
1991	if (FormatTok->is(II: Keywords.kw_table)) {
1992	parseVerilogTable();
1993	return;
1994	}
1995	if (Keywords.isVerilogBegin(Tok: *FormatTok) \|\|
1996	Keywords.isVerilogHierarchy(Tok: *FormatTok)) {
1997	parseBlock();
1998	addUnwrappedLine();
1999	return;
2000	}
2001	}
2002
2003	if (!IsCpp && FormatTok->is(II: Keywords.kw_interface)) {
2004	if (parseStructLike())
2005	return;
2006	break;
2007	}
2008
2009	if (IsCpp && FormatTok->is(TT: TT_StatementMacro)) {
2010	parseStatementMacro();
2011	return;
2012	}
2013
2014	// See if the following token should start a new unwrapped line.
2015	StringRef Text = FormatTok->TokenText;
2016
2017	FormatToken *PreviousToken = FormatTok;
2018	nextToken();
2019
2020	// JS doesn't have macros, and within classes colons indicate fields, not
2021	// labels.
2022	if (Style.isJavaScript())
2023	break;
2024
2025	auto OneTokenSoFar = [&]() {
2026	auto I = Line ->Tokens.begin(), E = Line ->Tokens.end();
2027	while (I != E && I ->Tok->is(Kind: tok::comment))
2028	++I;
2029	if (Style.isVerilog())
2030	while (I != E && I ->Tok->is(Kind: tok::hash))
2031	++I;
2032	return I != E && (++I == E);
2033	};
2034	if (OneTokenSoFar ()) {
2035	// Recognize function-like macro usages without trailing semicolon as
2036	// well as free-standing macros like Q_OBJECT.
2037	bool FunctionLike = FormatTok->is(Kind: tok::l_paren);
2038	if (FunctionLike)
2039	parseParens();
2040
2041	bool FollowedByNewline =
2042	CommentsBeforeNextToken.empty()
2043	? FormatTok->NewlinesBefore > `0`
2044	: CommentsBeforeNextToken.front()->NewlinesBefore > `0`;
2045
2046	if (FollowedByNewline &&
2047	(Text.size() >= `5` \|\|
2048	(FunctionLike && FormatTok->isNot(Kind: tok::l_paren))) &&
2049	tokenCanStartNewLine(Tok: *FormatTok) && Text == Text.upper()) {
2050	if (PreviousToken->isNot(Kind: TT_UntouchableMacroFunc))
2051	PreviousToken->setFinalizedType(TT_FunctionLikeOrFreestandingMacro);
2052	addUnwrappedLine();
2053	return;
2054	}
2055	}
2056	break;
2057	}
2058	case tok::equal:
2059	if ((Style.isJavaScript() \|\| Style.isCSharp()) &&
2060	FormatTok->is(TT: TT_FatArrow)) {
2061	tryToParseChildBlock();
2062	break;
2063	}
2064
2065	SeenEqual = true;
2066	nextToken();
2067	if (FormatTok->is(Kind: tok::l_brace)) {
2068	// Block kind should probably be set to BK_BracedInit for any language.
2069	// C# needs this change to ensure that array initialisers and object
2070	// initialisers are indented the same way.
2071	if (Style.isCSharp())
2072	FormatTok->setBlockKind(BK_BracedInit);
2073	// TableGen's defset statement has syntax of the form,
2074	// `defset <type> <name> = { <statement>... }`
2075	if (Style.isTableGen() &&
2076	Line ->Tokens.begin()->Tok->is(II: Keywords.kw_defset)) {
2077	FormatTok->setFinalizedType(TT_FunctionLBrace);
2078	parseBlock(/MustBeDeclaration=/false, /AddLevels=/`1u`,
2079	/MunchSemi=/false);
2080	addUnwrappedLine();
2081	break;
2082	}
2083	nextToken();
2084	parseBracedList();
2085	} else if (Style.Language == FormatStyle::LK_Proto &&
2086	FormatTok->is(Kind: tok::less)) {
2087	nextToken();
2088	parseBracedList(/IsAngleBracket=/true);
2089	}
2090	break;
2091	case tok::l_square:
2092	parseSquare();
2093	break;
2094	case tok::kw_new:
2095	if (Style.isCSharp() &&
2096	(Tokens->peekNextToken()->isAccessSpecifierKeyword() \|\|
2097	(Previous && Previous->isAccessSpecifierKeyword()))) {
2098	nextToken();
2099	} else {
2100	parseNew();
2101	}
2102	break;
2103	case tok::kw_switch:
2104	if (Style.isJava())
2105	parseSwitch(/IsExpr=/true);
2106	else
2107	nextToken();
2108	break;
2109	case tok::kw_case:
2110	// Proto: there are no switch/case statements.
2111	if (Style.Language == FormatStyle::LK_Proto) {
2112	nextToken();
2113	return;
2114	}
2115	// In Verilog switch is called case.
2116	if (Style.isVerilog()) {
2117	parseBlock();
2118	addUnwrappedLine();
2119	return;
2120	}
2121	if (Style.isJavaScript() && Line ->MustBeDeclaration) {
2122	// 'case: string' field declaration.
2123	nextToken();
2124	break;
2125	}
2126	parseCaseLabel();
2127	break;
2128	case tok::kw_default:
2129	nextToken();
2130	if (Style.isVerilog()) {
2131	if (FormatTok->is(Kind: tok::colon)) {
2132	// The label will be handled in the next iteration.
2133	break;
2134	}
2135	if (FormatTok->is(II: Keywords.kw_clocking)) {
2136	// A default clocking block.
2137	parseBlock();
2138	addUnwrappedLine();
2139	return;
2140	}
2141	parseVerilogCaseLabel();
2142	return;
2143	}
2144	break;
2145	case tok::colon:
2146	nextToken();
2147	if (Style.isVerilog()) {
2148	parseVerilogCaseLabel();
2149	return;
2150	}
2151	break;
2152	case tok::greater:
2153	nextToken();
2154	if (FormatTok->is(Kind: tok::l_brace))
2155	FormatTok->Previous->setFinalizedType(TT_TemplateCloser);
2156	break;
2157	default:
2158	nextToken();
2159	break;
2160	}
2161	}
2162	}
2163
2164	bool UnwrappedLineParser::tryToParsePropertyAccessor() {
2165	assert(FormatTok->is(tok::l_brace));
2166	if (!Style.isCSharp())
2167	return false;
2168	// See if it's a property accessor.
2169	if (!FormatTok->Previous \|\| FormatTok->Previous->isNot(Kind: tok::identifier))
2170	return false;
2171
2172	// See if we are inside a property accessor.
2173	//
2174	// Record the current tokenPosition so that we can advance and
2175	// reset the current token. `Next` is not set yet so we need
2176	// another way to advance along the token stream.
2177	unsigned int StoredPosition = Tokens->getPosition();
2178	FormatToken *Tok = Tokens->getNextToken();
2179
2180	// A trivial property accessor is of the form:
2181	// { [ACCESS_SPECIFIER] [get]; [ACCESS_SPECIFIER] [set\|init] }
2182	// Track these as they do not require line breaks to be introduced.
2183	bool HasSpecialAccessor = false;
2184	bool IsTrivialPropertyAccessor = true;
2185	bool HasAttribute = false;
2186	while (!eof()) {
2187	if (const bool IsAccessorKeyword =
2188	Tok->isOneOf(K1: Keywords.kw_get, K2: Keywords.kw_init, Ks: Keywords.kw_set);
2189	IsAccessorKeyword \|\| Tok->isAccessSpecifierKeyword() \|\|
2190	Tok->isOneOf(K1: tok::l_square, K2: tok::semi, Ks: Keywords.kw_internal)) {
2191	if (IsAccessorKeyword)
2192	HasSpecialAccessor = true;
2193	else if (Tok->is(Kind: tok::l_square))
2194	HasAttribute = true;
2195	Tok = Tokens->getNextToken();
2196	continue;
2197	}
2198	if (Tok->isNot(Kind: tok::r_brace))
2199	IsTrivialPropertyAccessor = false;
2200	break;
2201	}
2202
2203	if (!HasSpecialAccessor \|\| HasAttribute) {
2204	Tokens->setPosition(StoredPosition);
2205	return false;
2206	}
2207
2208	// Try to parse the property accessor:
2209	// https://docs.microsoft.com/en-us/dotnet/csharp/programming-guide/classes-and-structs/properties
2210	Tokens->setPosition(StoredPosition);
2211	if (!IsTrivialPropertyAccessor && Style.BraceWrapping.AfterFunction)
2212	addUnwrappedLine();
2213	nextToken();
2214	do {
2215	switch (FormatTok->Tok.getKind()) {
2216	case tok::r_brace:
2217	nextToken();
2218	if (FormatTok->is(Kind: tok::equal)) {
2219	while (!eof() && FormatTok->isNot(Kind: tok::semi))
2220	nextToken();
2221	nextToken();
2222	}
2223	addUnwrappedLine();
2224	return true;
2225	case tok::l_brace:
2226	++Line ->Level;
2227	parseBlock(/MustBeDeclaration=/true);
2228	addUnwrappedLine();
2229	--Line ->Level;
2230	break;
2231	case tok::equal:
2232	if (FormatTok->is(TT: TT_FatArrow)) {
2233	++Line ->Level;
2234	do {
2235	nextToken();
2236	} while (!eof() && FormatTok->isNot(Kind: tok::semi));
2237	nextToken();
2238	addUnwrappedLine();
2239	--Line ->Level;
2240	break;
2241	}
2242	nextToken();
2243	break;
2244	default:
2245	if (FormatTok->isOneOf(K1: Keywords.kw_get, K2: Keywords.kw_init,
2246	Ks: Keywords.kw_set) &&
2247	!IsTrivialPropertyAccessor) {
2248	// Non-trivial get/set needs to be on its own line.
2249	addUnwrappedLine();
2250	}
2251	nextToken();
2252	}
2253	} while (!eof());
2254
2255	// Unreachable for well-formed code (paired '{' and '}').
2256	return true;
2257	}
2258
2259	bool UnwrappedLineParser::tryToParseLambda() {
2260	assert(FormatTok->is(tok::l_square));
2261	if (!IsCpp) {
2262	nextToken();
2263	return false;
2264	}
2265	FormatToken &LSquare = *FormatTok;
2266	if (!tryToParseLambdaIntroducer())
2267	return false;
2268
2269	bool SeenArrow = false;
2270	bool InTemplateParameterList = false;
2271
2272	while (FormatTok->isNot(Kind: tok::l_brace)) {
2273	if (FormatTok->isTypeName(LangOpts) \|\| FormatTok->isAttribute()) {
2274	nextToken();
2275	continue;
2276	}
2277	switch (FormatTok->Tok.getKind()) {
2278	case tok::l_brace:
2279	break;
2280	case tok::l_paren:
2281	parseParens(/AmpAmpTokenType=/TT_PointerOrReference);
2282	break;
2283	case tok::l_square:
2284	parseSquare();
2285	break;
2286	case tok::less:
2287	assert(FormatTok->Previous);
2288	if (FormatTok->Previous->is(Kind: tok::r_square))
2289	InTemplateParameterList = true;
2290	nextToken();
2291	break;
2292	case tok::kw_auto:
2293	case tok::kw_class:
2294	case tok::kw_struct:
2295	case tok::kw_union:
2296	case tok::kw_template:
2297	case tok::kw_typename:
2298	case tok::amp:
2299	case tok::star:
2300	case tok::kw_const:
2301	case tok::kw_constexpr:
2302	case tok::kw_consteval:
2303	case tok::comma:
2304	case tok::greater:
2305	case tok::identifier:
2306	case tok::numeric_constant:
2307	case tok::coloncolon:
2308	case tok::kw_mutable:
2309	case tok::kw_noexcept:
2310	case tok::kw_static:
2311	nextToken();
2312	break;
2313	// Specialization of a template with an integer parameter can contain
2314	// arithmetic, logical, comparison and ternary operators.
2315	//
2316	// FIXME: This also accepts sequences of operators that are not in the scope
2317	// of a template argument list.
2318	//
2319	// In a C++ lambda a template type can only occur after an arrow. We use
2320	// this as an heuristic to distinguish between Objective-C expressions
2321	// followed by an `a->b` expression, such as:
2322	// ([obj func:arg] + a->b)
2323	// Otherwise the code below would parse as a lambda.
2324	case tok::plus:
2325	case tok::minus:
2326	case tok::exclaim:
2327	case tok::tilde:
2328	case tok::slash:
2329	case tok::percent:
2330	case tok::lessless:
2331	case tok::pipe:
2332	case tok::pipepipe:
2333	case tok::ampamp:
2334	case tok::caret:
2335	case tok::equalequal:
2336	case tok::exclaimequal:
2337	case tok::greaterequal:
2338	case tok::lessequal:
2339	case tok::question:
2340	case tok::colon:
2341	case tok::ellipsis:
2342	case tok::kw_true:
2343	case tok::kw_false:
2344	if (SeenArrow \|\| InTemplateParameterList) {
2345	nextToken();
2346	break;
2347	}
2348	return true;
2349	case tok::arrow:
2350	// This might or might not actually be a lambda arrow (this could be an
2351	// ObjC method invocation followed by a dereferencing arrow). We might
2352	// reset this back to TT_Unknown in TokenAnnotator.
2353	FormatTok->setFinalizedType(TT_LambdaArrow);
2354	SeenArrow = true;
2355	nextToken();
2356	break;
2357	case tok::kw_requires: {
2358	auto *RequiresToken = FormatTok;
2359	nextToken();
2360	parseRequiresClause(RequiresToken);
2361	break;
2362	}
2363	case tok::equal:
2364	if (!InTemplateParameterList)
2365	return true;
2366	nextToken();
2367	break;
2368	default:
2369	return true;
2370	}
2371	}
2372
2373	FormatTok->setFinalizedType(TT_LambdaLBrace);
2374	LSquare.setFinalizedType(TT_LambdaLSquare);
2375
2376	NestedLambdas.push_back(Elt: Line ->SeenDecltypeAuto);
2377	parseChildBlock();
2378	assert(!NestedLambdas.empty());
2379	NestedLambdas.pop_back();
2380
2381	return true;
2382	}
2383
2384	bool UnwrappedLineParser::tryToParseLambdaIntroducer() {
2385	const FormatToken *Previous = FormatTok->Previous;
2386	const FormatToken *LeftSquare = FormatTok;
2387	nextToken();
2388	if (Previous) {
2389	if (Previous->Tok.getIdentifierInfo() &&
2390	!Previous->isOneOf(K1: tok::kw_return, K2: tok::kw_co_await, Ks: tok::kw_co_yield,
2391	Ks: tok::kw_co_return)) {
2392	return false;
2393	}
2394	if (Previous->closesScope()) {
2395	// Not a potential C-style cast.
2396	if (Previous->isNot(Kind: tok::r_paren))
2397	return false;
2398	const auto *BeforeRParen = Previous->getPreviousNonComment();
2399	// Lambdas can be cast to function types only, e.g. `std::function<int()>`
2400	// and `int ()()`.*
2401	if (!BeforeRParen \|\| !BeforeRParen->isOneOf(K1: tok::greater, K2: tok::r_paren))
2402	return false;
2403	}
2404	}
2405	if (LeftSquare->isCppStructuredBinding(IsCpp))
2406	return false;
2407	if (FormatTok->is(Kind: tok::l_square) \|\| tok::isLiteral(K: FormatTok->Tok.getKind()))
2408	return false;
2409	if (FormatTok->is(Kind: tok::r_square)) {
2410	const FormatToken Next = Tokens->peekNextToken(/SkipComment=/*true);
2411	if (Next->is(Kind: tok::greater))
2412	return false;
2413	}
2414	parseSquare(/LambdaIntroducer=/true);
2415	return true;
2416	}
2417
2418	void UnwrappedLineParser::tryToParseJSFunction() {
2419	assert(FormatTok->is(Keywords.kw_function));
2420	if (FormatTok->is(II: Keywords.kw_async))
2421	nextToken();
2422	// Consume "function".
2423	nextToken();
2424
2425	// Consume (generator function). Treat it like C++'s overloaded operators.*
2426	if (FormatTok->is(Kind: tok::star)) {
2427	FormatTok->setFinalizedType(TT_OverloadedOperator);
2428	nextToken();
2429	}
2430
2431	// Consume function name.
2432	if (FormatTok->is(Kind: tok::identifier))
2433	nextToken();
2434
2435	if (FormatTok->isNot(Kind: tok::l_paren))
2436	return;
2437
2438	// Parse formal parameter list.
2439	parseParens();
2440
2441	if (FormatTok->is(Kind: tok::colon)) {
2442	// Parse a type definition.
2443	nextToken();
2444
2445	// Eat the type declaration. For braced inline object types, balance braces,
2446	// otherwise just parse until finding an l_brace for the function body.
2447	if (FormatTok->is(Kind: tok::l_brace))
2448	tryToParseBracedList();
2449	else
2450	while (!FormatTok->isOneOf(K1: tok::l_brace, K2: tok::semi) && !eof())
2451	nextToken();
2452	}
2453
2454	if (FormatTok->is(Kind: tok::semi))
2455	return;
2456
2457	parseChildBlock();
2458	}
2459
2460	bool UnwrappedLineParser::tryToParseBracedList() {
2461	if (FormatTok->is(BBK: BK_Unknown))
2462	calculateBraceTypes();
2463	assert(FormatTok->isNot(BK_Unknown));
2464	if (FormatTok->is(BBK: BK_Block))
2465	return false;
2466	nextToken();
2467	parseBracedList();
2468	return true;
2469	}
2470
2471	bool UnwrappedLineParser::tryToParseChildBlock() {
2472	assert(Style.isJavaScript() \|\| Style.isCSharp());
2473	assert(FormatTok->is(TT_FatArrow));
2474	// Fat arrows (=>) have tok::TokenKind tok::equal but TokenType TT_FatArrow.
2475	// They always start an expression or a child block if followed by a curly
2476	// brace.
2477	nextToken();
2478	if (FormatTok->isNot(Kind: tok::l_brace))
2479	return false;
2480	parseChildBlock();
2481	return true;
2482	}
2483
2484	bool UnwrappedLineParser::parseBracedList(bool IsAngleBracket, bool IsEnum) {
2485	assert(!IsAngleBracket \|\| !IsEnum);
2486	bool HasError = false;
2487
2488	// FIXME: Once we have an expression parser in the UnwrappedLineParser,
2489	// replace this by using parseAssignmentExpression() inside.
2490	do {
2491	if (Style.isCSharp() && FormatTok->is(TT: TT_FatArrow) &&
2492	tryToParseChildBlock()) {
2493	continue;
2494	}
2495	if (Style.isJavaScript()) {
2496	if (FormatTok->is(II: Keywords.kw_function)) {
2497	tryToParseJSFunction();
2498	continue;
2499	}
2500	if (FormatTok->is(Kind: tok::l_brace)) {
2501	// Could be a method inside of a braced list `{a() { return 1; }}`.
2502	if (tryToParseBracedList())
2503	continue;
2504	parseChildBlock();
2505	}
2506	}
2507	if (FormatTok->is(Kind: IsAngleBracket ? tok::greater : tok::r_brace)) {
2508	if (IsEnum) {
2509	FormatTok->setBlockKind(BK_Block);
2510	if (!Style.AllowShortEnumsOnASingleLine)
2511	addUnwrappedLine();
2512	}
2513	nextToken();
2514	return !HasError;
2515	}
2516	switch (FormatTok->Tok.getKind()) {
2517	case tok::l_square:
2518	if (Style.isCSharp())
2519	parseSquare();
2520	else
2521	tryToParseLambda();
2522	break;
2523	case tok::l_paren:
2524	parseParens();
2525	// JavaScript can just have free standing methods and getters/setters in
2526	// object literals. Detect them by a "{" following ")".
2527	if (Style.isJavaScript()) {
2528	if (FormatTok->is(Kind: tok::l_brace))
2529	parseChildBlock();
2530	break;
2531	}
2532	break;
2533	case tok::l_brace:
2534	// Assume there are no blocks inside a braced init list apart
2535	// from the ones we explicitly parse out (like lambdas).
2536	FormatTok->setBlockKind(BK_BracedInit);
2537	if (!IsAngleBracket) {
2538	auto *Prev = FormatTok->Previous;
2539	if (Prev && Prev->is(Kind: tok::greater))
2540	Prev->setFinalizedType(TT_TemplateCloser);
2541	}
2542	nextToken();
2543	parseBracedList();
2544	break;
2545	case tok::less:
2546	nextToken();
2547	if (IsAngleBracket)
2548	parseBracedList(/IsAngleBracket=/true);
2549	break;
2550	case tok::semi:
2551	// JavaScript (or more precisely TypeScript) can have semicolons in braced
2552	// lists (in so-called TypeMemberLists). Thus, the semicolon cannot be
2553	// used for error recovery if we have otherwise determined that this is
2554	// a braced list.
2555	if (Style.isJavaScript()) {
2556	nextToken();
2557	break;
2558	}
2559	HasError = true;
2560	if (!IsEnum)
2561	return false;
2562	nextToken();
2563	break;
2564	case tok::comma:
2565	nextToken();
2566	if (IsEnum && !Style.AllowShortEnumsOnASingleLine)
2567	addUnwrappedLine();
2568	break;
2569	default:
2570	nextToken();
2571	break;
2572	}
2573	} while (!eof());
2574	return false;
2575	}
2576
2577	/// Parses a pair of parentheses (and everything between them).
2578	/// \param AmpAmpTokenType If different than TT_Unknown sets this type for all
2579	/// double ampersands. This applies for all nested scopes as well.
2580	///
2581	/// Returns whether there is a `=` token between the parentheses.
2582	bool UnwrappedLineParser::parseParens(TokenType AmpAmpTokenType) {
2583	assert(FormatTok->is(tok::l_paren) && "'(' expected.");
2584	auto *LParen = FormatTok;
2585	bool SeenComma = false;
2586	bool SeenEqual = false;
2587	bool MightBeFoldExpr = false;
2588	nextToken();
2589	const bool MightBeStmtExpr = FormatTok->is(Kind: tok::l_brace);
2590	do {
2591	switch (FormatTok->Tok.getKind()) {
2592	case tok::l_paren:
2593	if (parseParens(AmpAmpTokenType))
2594	SeenEqual = true;
2595	if (Style.isJava() && FormatTok->is(Kind: tok::l_brace))
2596	parseChildBlock();
2597	break;
2598	case tok::r_paren: {
2599	auto *Prev = LParen->Previous;
2600	auto *RParen = FormatTok;
2601	nextToken();
2602	if (Prev) {
2603	auto OptionalParens = [&] {
2604	if (MightBeStmtExpr \|\| MightBeFoldExpr \|\| Line ->InMacroBody \|\|
2605	SeenComma \|\| Style.RemoveParentheses == FormatStyle::RPS_Leave \|\|
2606	RParen->getPreviousNonComment() == LParen) {
2607	return false;
2608	}
2609	const bool DoubleParens =
2610	Prev->is(Kind: tok::l_paren) && FormatTok->is(Kind: tok::r_paren);
2611	if (DoubleParens) {
2612	const auto *PrevPrev = Prev->getPreviousNonComment();
2613	const bool Excluded =
2614	PrevPrev &&
2615	(PrevPrev->isOneOf(K1: tok::kw___attribute, K2: tok::kw_decltype) \|\|
2616	(SeenEqual &&
2617	(PrevPrev->isOneOf(K1: tok::kw_if, K2: tok::kw_while) \|\|
2618	PrevPrev->endsSequence(K1: tok::kw_constexpr, Tokens: tok::kw_if))));
2619	if (!Excluded)
2620	return true;
2621	} else {
2622	const bool CommaSeparated =
2623	Prev->isOneOf(K1: tok::l_paren, K2: tok::comma) &&
2624	FormatTok->isOneOf(K1: tok::comma, K2: tok::r_paren);
2625	if (CommaSeparated &&
2626	// LParen is not preceded by ellipsis, comma.
2627	!Prev->endsSequence(K1: tok::comma, Tokens: tok::ellipsis) &&
2628	// RParen is not followed by comma, ellipsis.
2629	!(FormatTok->is(Kind: tok::comma) &&
2630	Tokens->peekNextToken()->is(Kind: tok::ellipsis))) {
2631	return true;
2632	}
2633	const bool ReturnParens =
2634	Style.RemoveParentheses == FormatStyle::RPS_ReturnStatement &&
2635	((NestedLambdas.empty() && !IsDecltypeAutoFunction) \|\|
2636	(!NestedLambdas.empty() && !NestedLambdas.back())) &&
2637	Prev->isOneOf(K1: tok::kw_return, K2: tok::kw_co_return) &&
2638	FormatTok->is(Kind: tok::semi);
2639	if (ReturnParens)
2640	return true;
2641	}
2642	return false;
2643	};
2644	if (Prev->is(TT: TT_TypenameMacro)) {
2645	LParen->setFinalizedType(TT_TypeDeclarationParen);
2646	RParen->setFinalizedType(TT_TypeDeclarationParen);
2647	} else if (Prev->is(Kind: tok::greater) && RParen->Previous == LParen) {
2648	Prev->setFinalizedType(TT_TemplateCloser);
2649	} else if (OptionalParens ()) {
2650	LParen->Optional = true;
2651	RParen->Optional = true;
2652	}
2653	}
2654	return SeenEqual;
2655	}
2656	case tok::r_brace:
2657	// A "}" inside parenthesis is an error if there wasn't a matching "{".
2658	return SeenEqual;
2659	case tok::l_square:
2660	tryToParseLambda();
2661	break;
2662	case tok::l_brace:
2663	if (!tryToParseBracedList())
2664	parseChildBlock();
2665	break;
2666	case tok::at:
2667	nextToken();
2668	if (FormatTok->is(Kind: tok::l_brace)) {
2669	nextToken();
2670	parseBracedList();
2671	}
2672	break;
2673	case tok::comma:
2674	SeenComma = true;
2675	nextToken();
2676	break;
2677	case tok::ellipsis:
2678	MightBeFoldExpr = true;
2679	nextToken();
2680	break;
2681	case tok::equal:
2682	SeenEqual = true;
2683	if (Style.isCSharp() && FormatTok->is(TT: TT_FatArrow))
2684	tryToParseChildBlock();
2685	else
2686	nextToken();
2687	break;
2688	case tok::kw_class:
2689	if (Style.isJavaScript())
2690	parseRecord(/ParseAsExpr=/true);
2691	else
2692	nextToken();
2693	break;
2694	case tok::identifier:
2695	if (Style.isJavaScript() && (FormatTok->is(II: Keywords.kw_function)))
2696	tryToParseJSFunction();
2697	else
2698	nextToken();
2699	break;
2700	case tok::kw_switch:
2701	if (Style.isJava())
2702	parseSwitch(/IsExpr=/true);
2703	else
2704	nextToken();
2705	break;
2706	case tok::kw_requires: {
2707	auto RequiresToken = FormatTok;
2708	nextToken();
2709	parseRequiresExpression(RequiresToken);
2710	break;
2711	}
2712	case tok::ampamp:
2713	if (AmpAmpTokenType != TT_Unknown)
2714	FormatTok->setFinalizedType(AmpAmpTokenType);
2715	[[fallthrough]];
2716	default:
2717	nextToken();
2718	break;
2719	}
2720	} while (!eof());
2721	return SeenEqual;
2722	}
2723
2724	void UnwrappedLineParser::parseSquare(bool LambdaIntroducer) {
2725	if (!LambdaIntroducer) {
2726	assert(FormatTok->is(tok::l_square) && "'[' expected.");
2727	if (tryToParseLambda())
2728	return;
2729	}
2730	do {
2731	switch (FormatTok->Tok.getKind()) {
2732	case tok::l_paren:
2733	parseParens();
2734	break;
2735	case tok::r_square:
2736	nextToken();
2737	return;
2738	case tok::r_brace:
2739	// A "}" inside parenthesis is an error if there wasn't a matching "{".
2740	return;
2741	case tok::l_square:
2742	parseSquare();
2743	break;
2744	case tok::l_brace: {
2745	if (!tryToParseBracedList())
2746	parseChildBlock();
2747	break;
2748	}
2749	case tok::at:
2750	case tok::colon:
2751	nextToken();
2752	if (FormatTok->is(Kind: tok::l_brace)) {
2753	nextToken();
2754	parseBracedList();
2755	}
2756	break;
2757	default:
2758	nextToken();
2759	break;
2760	}
2761	} while (!eof());
2762	}
2763
2764	void UnwrappedLineParser::keepAncestorBraces() {
2765	if (!Style.RemoveBracesLLVM)
2766	return;
2767
2768	const int MaxNestingLevels = `2`;
2769	const int Size = NestedTooDeep.size();
2770	if (Size >= MaxNestingLevels)
2771	NestedTooDeep [Size - MaxNestingLevels] = true;
2772	NestedTooDeep.push_back(Elt: false);
2773	}
2774
2775	static FormatToken getLastNonComment(const* UnwrappedLine &Line) {
2776	for (const auto &Token : llvm::reverse(C: Line.Tokens))
2777	if (Token.Tok->isNot(Kind: tok::comment))
2778	return Token.Tok;
2779
2780	return nullptr;
2781	}
2782
2783	void UnwrappedLineParser::parseUnbracedBody(bool CheckEOF) {
2784	FormatToken Tok = nullptr*;
2785
2786	if (Style.InsertBraces && !Line ->InPPDirective && !Line ->Tokens.empty() &&
2787	PreprocessorDirectives.empty() && FormatTok->isNot(Kind: tok::semi)) {
2788	Tok = Style.BraceWrapping.AfterControlStatement == FormatStyle::BWACS_Never
2789	? getLastNonComment(Line: *Line)
2790	: Line ->Tokens.back().Tok;
2791	assert(Tok);
2792	if (Tok->BraceCount < `0`) {
2793	assert(Tok->BraceCount == -`1`);
2794	Tok = nullptr;
2795	} else {
2796	Tok->BraceCount = -`1`;
2797	}
2798	}
2799
2800	addUnwrappedLine();
2801	++Line ->Level;
2802	++Line ->UnbracedBodyLevel;
2803	parseStructuralElement();
2804	--Line ->UnbracedBodyLevel;
2805
2806	if (Tok) {
2807	assert(!Line->InPPDirective);
2808	Tok = nullptr;
2809	for (const auto &L : llvm::reverse(C&: *CurrentLines)) {
2810	if (!L.InPPDirective && getLastNonComment(Line: L)) {
2811	Tok = L.Tokens.back().Tok;
2812	break;
2813	}
2814	}
2815	assert(Tok);
2816	++Tok->BraceCount;
2817	}
2818
2819	if (CheckEOF && eof())
2820	addUnwrappedLine();
2821
2822	--Line ->Level;
2823	}
2824
2825	static void markOptionalBraces(FormatToken *LeftBrace) {
2826	if (!LeftBrace)
2827	return;
2828
2829	assert(LeftBrace->is(tok::l_brace));
2830
2831	FormatToken *RightBrace = LeftBrace->MatchingParen;
2832	if (!RightBrace) {
2833	assert(!LeftBrace->Optional);
2834	return;
2835	}
2836
2837	assert(RightBrace->is(tok::r_brace));
2838	assert(RightBrace->MatchingParen == LeftBrace);
2839	assert(LeftBrace->Optional == RightBrace->Optional);
2840
2841	LeftBrace->Optional = true;
2842	RightBrace->Optional = true;
2843	}
2844
2845	void UnwrappedLineParser::handleAttributes() {
2846	// Handle AttributeMacro, e.g. `if (x) UNLIKELY`.
2847	if (FormatTok->isAttribute())
2848	nextToken();
2849	else if (FormatTok->is(Kind: tok::l_square))
2850	handleCppAttributes();
2851	}
2852
2853	bool UnwrappedLineParser::handleCppAttributes() {
2854	// Handle [[likely]] / [[unlikely]] attributes.
2855	assert(FormatTok->is(tok::l_square));
2856	if (!tryToParseSimpleAttribute())
2857	return false;
2858	parseSquare();
2859	return true;
2860	}
2861
2862	/// Returns whether \c Tok begins a block.
2863	bool UnwrappedLineParser::isBlockBegin(const FormatToken &Tok) const {
2864	// FIXME: rename the function or make
2865	// Tok.isOneOf(tok::l_brace, TT_MacroBlockBegin) work.
2866	return Style.isVerilog() ? Keywords.isVerilogBegin(Tok)
2867	: Tok.is(Kind: tok::l_brace);
2868	}
2869
2870	FormatToken UnwrappedLineParser::parseIfThenElse(IfStmtKind IfKind,
2871	bool KeepBraces,
2872	bool IsVerilogAssert) {
2873	assert((FormatTok->is(tok::kw_if) \|\|
2874	(Style.isVerilog() &&
2875	FormatTok->isOneOf(tok::kw_restrict, Keywords.kw_assert,
2876	Keywords.kw_assume, Keywords.kw_cover))) &&
2877	"'if' expected");
2878	nextToken();
2879
2880	if (IsVerilogAssert) {
2881	// Handle `assert #0` and `assert final`.
2882	if (FormatTok->is(II: Keywords.kw_verilogHash)) {
2883	nextToken();
2884	if (FormatTok->is(Kind: tok::numeric_constant))
2885	nextToken();
2886	} else if (FormatTok->isOneOf(K1: Keywords.kw_final, K2: Keywords.kw_property,
2887	Ks: Keywords.kw_sequence)) {
2888	nextToken();
2889	}
2890	}
2891
2892	// TableGen's if statement has the form of `if <cond> then { ... }`.
2893	if (Style.isTableGen()) {
2894	while (!eof() && FormatTok->isNot(Kind: Keywords.kw_then)) {
2895	// Simply skip until then. This range only contains a value.
2896	nextToken();
2897	}
2898	}
2899
2900	// Handle `if !consteval`.
2901	if (FormatTok->is(Kind: tok::exclaim))
2902	nextToken();
2903
2904	bool KeepIfBraces = true;
2905	if (FormatTok->is(Kind: tok::kw_consteval)) {
2906	nextToken();
2907	} else {
2908	KeepIfBraces = !Style.RemoveBracesLLVM \|\| KeepBraces;
2909	if (FormatTok->isOneOf(K1: tok::kw_constexpr, K2: tok::identifier))
2910	nextToken();
2911	if (FormatTok->is(Kind: tok::l_paren)) {
2912	FormatTok->setFinalizedType(TT_ConditionLParen);
2913	parseParens();
2914	}
2915	}
2916	handleAttributes();
2917	// The then action is optional in Verilog assert statements.
2918	if (IsVerilogAssert && FormatTok->is(Kind: tok::semi)) {
2919	nextToken();
2920	addUnwrappedLine();
2921	return nullptr;
2922	}
2923
2924	bool NeedsUnwrappedLine = false;
2925	keepAncestorBraces();
2926
2927	FormatToken IfLeftBrace = nullptr*;
2928	IfStmtKind IfBlockKind = IfStmtKind::NotIf;
2929
2930	if (isBlockBegin(Tok: *FormatTok)) {
2931	FormatTok->setFinalizedType(TT_ControlStatementLBrace);
2932	IfLeftBrace = FormatTok;
2933	CompoundStatementIndenter Indenter(this, Style, Line ->Level);
2934	parseBlock(/MustBeDeclaration=/false, /AddLevels=/`1u`,
2935	/MunchSemi=/true, KeepBraces: KeepIfBraces, IfKind: &IfBlockKind);
2936	setPreviousRBraceType(TT_ControlStatementRBrace);
2937	if (Style.BraceWrapping.BeforeElse)
2938	addUnwrappedLine();
2939	else
2940	NeedsUnwrappedLine = true;
2941	} else if (IsVerilogAssert && FormatTok->is(Kind: tok::kw_else)) {
2942	addUnwrappedLine();
2943	} else {
2944	parseUnbracedBody();
2945	}
2946
2947	if (Style.RemoveBracesLLVM) {
2948	assert(!NestedTooDeep.empty());
2949	KeepIfBraces = KeepIfBraces \|\|
2950	(IfLeftBrace && !IfLeftBrace->MatchingParen) \|\|
2951	NestedTooDeep.back() \|\| IfBlockKind == IfStmtKind::IfOnly \|\|
2952	IfBlockKind == IfStmtKind::IfElseIf;
2953	}
2954
2955	bool KeepElseBraces = KeepIfBraces;
2956	FormatToken ElseLeftBrace = nullptr*;
2957	IfStmtKind Kind = IfStmtKind::IfOnly;
2958
2959	if (FormatTok->is(Kind: tok::kw_else)) {
2960	if (Style.RemoveBracesLLVM) {
2961	NestedTooDeep.back() = false;
2962	Kind = IfStmtKind::IfElse;
2963	}
2964	nextToken();
2965	handleAttributes();
2966	if (isBlockBegin(Tok: *FormatTok)) {
2967	const bool FollowedByIf = Tokens->peekNextToken()->is(Kind: tok::kw_if);
2968	FormatTok->setFinalizedType(TT_ElseLBrace);
2969	ElseLeftBrace = FormatTok;
2970	CompoundStatementIndenter Indenter(this, Style, Line ->Level);
2971	IfStmtKind ElseBlockKind = IfStmtKind::NotIf;
2972	FormatToken *IfLBrace =
2973	parseBlock(/MustBeDeclaration=/false, /AddLevels=/`1u`,
2974	/MunchSemi=/true, KeepBraces: KeepElseBraces, IfKind: &ElseBlockKind);
2975	setPreviousRBraceType(TT_ElseRBrace);
2976	if (FormatTok->is(Kind: tok::kw_else)) {
2977	KeepElseBraces = KeepElseBraces \|\|
2978	ElseBlockKind == IfStmtKind::IfOnly \|\|
2979	ElseBlockKind == IfStmtKind::IfElseIf;
2980	} else if (FollowedByIf && IfLBrace && !IfLBrace->Optional) {
2981	KeepElseBraces = true;
2982	assert(ElseLeftBrace->MatchingParen);
2983	markOptionalBraces(LeftBrace: ElseLeftBrace);
2984	}
2985	addUnwrappedLine();
2986	} else if (!IsVerilogAssert && FormatTok->is(Kind: tok::kw_if)) {
2987	const FormatToken *Previous = Tokens->getPreviousToken();
2988	assert(Previous);
2989	const bool IsPrecededByComment = Previous->is(Kind: tok::comment);
2990	if (IsPrecededByComment) {
2991	addUnwrappedLine();
2992	++Line ->Level;
2993	}
2994	bool TooDeep = true;
2995	if (Style.RemoveBracesLLVM) {
2996	Kind = IfStmtKind::IfElseIf;
2997	TooDeep = NestedTooDeep.pop_back_val();
2998	}
2999	ElseLeftBrace = parseIfThenElse(/IfKind=/nullptr, KeepBraces: KeepIfBraces);
3000	if (Style.RemoveBracesLLVM)
3001	NestedTooDeep.push_back(Elt: TooDeep);
3002	if (IsPrecededByComment)
3003	--Line ->Level;
3004	} else {
3005	parseUnbracedBody(/CheckEOF=/true);
3006	}
3007	} else {
3008	KeepIfBraces = KeepIfBraces \|\| IfBlockKind == IfStmtKind::IfElse;
3009	if (NeedsUnwrappedLine)
3010	addUnwrappedLine();
3011	}
3012
3013	if (!Style.RemoveBracesLLVM)
3014	return nullptr;
3015
3016	assert(!NestedTooDeep.empty());
3017	KeepElseBraces = KeepElseBraces \|\|
3018	(ElseLeftBrace && !ElseLeftBrace->MatchingParen) \|\|
3019	NestedTooDeep.back();
3020
3021	NestedTooDeep.pop_back();
3022
3023	if (!KeepIfBraces && !KeepElseBraces) {
3024	markOptionalBraces(LeftBrace: IfLeftBrace);
3025	markOptionalBraces(LeftBrace: ElseLeftBrace);
3026	} else if (IfLeftBrace) {
3027	FormatToken *IfRightBrace = IfLeftBrace->MatchingParen;
3028	if (IfRightBrace) {
3029	assert(IfRightBrace->MatchingParen == IfLeftBrace);
3030	assert(!IfLeftBrace->Optional);
3031	assert(!IfRightBrace->Optional);
3032	IfLeftBrace->MatchingParen = nullptr;
3033	IfRightBrace->MatchingParen = nullptr;
3034	}
3035	}
3036
3037	if (IfKind)
3038	*IfKind = Kind;
3039
3040	return IfLeftBrace;
3041	}
3042
3043	void UnwrappedLineParser::parseTryCatch() {
3044	assert(FormatTok->isOneOf(tok::kw_try, tok::kw___try) && "'try' expected");
3045	nextToken();
3046	bool NeedsUnwrappedLine = false;
3047	bool HasCtorInitializer = false;
3048	if (FormatTok->is(Kind: tok::colon)) {
3049	auto *Colon = FormatTok;
3050	// We are in a function try block, what comes is an initializer list.
3051	nextToken();
3052	if (FormatTok->is(Kind: tok::identifier)) {
3053	HasCtorInitializer = true;
3054	Colon->setFinalizedType(TT_CtorInitializerColon);
3055	}
3056
3057	// In case identifiers were removed by clang-tidy, what might follow is
3058	// multiple commas in sequence - before the first identifier.
3059	while (FormatTok->is(Kind: tok::comma))
3060	nextToken();
3061
3062	while (FormatTok->is(Kind: tok::identifier)) {
3063	nextToken();
3064	if (FormatTok->is(Kind: tok::l_paren)) {
3065	parseParens();
3066	} else if (FormatTok->is(Kind: tok::l_brace)) {
3067	nextToken();
3068	parseBracedList();
3069	}
3070
3071	// In case identifiers were removed by clang-tidy, what might follow is
3072	// multiple commas in sequence - after the first identifier.
3073	while (FormatTok->is(Kind: tok::comma))
3074	nextToken();
3075	}
3076	}
3077	// Parse try with resource.
3078	if (Style.isJava() && FormatTok->is(Kind: tok::l_paren))
3079	parseParens();
3080
3081	keepAncestorBraces();
3082
3083	if (FormatTok->is(Kind: tok::l_brace)) {
3084	if (HasCtorInitializer)
3085	FormatTok->setFinalizedType(TT_FunctionLBrace);
3086	CompoundStatementIndenter Indenter(this, Style, Line ->Level);
3087	parseBlock();
3088	if (Style.BraceWrapping.BeforeCatch)
3089	addUnwrappedLine();
3090	else
3091	NeedsUnwrappedLine = true;
3092	} else if (FormatTok->isNot(Kind: tok::kw_catch)) {
3093	// The C++ standard requires a compound-statement after a try.
3094	// If there's none, we try to assume there's a structuralElement
3095	// and try to continue.
3096	addUnwrappedLine();
3097	++Line ->Level;
3098	parseStructuralElement();
3099	--Line ->Level;
3100	}
3101	for (bool SeenCatch = false;;) {
3102	if (FormatTok->is(Kind: tok::at))
3103	nextToken();
3104	if (!(FormatTok->isOneOf(K1: tok::kw_catch, K2: Keywords.kw___except,
3105	Ks: tok::kw___finally, Ks: tok::objc_catch,
3106	Ks: tok::objc_finally) \|\|
3107	((Style.isJava() \|\| Style.isJavaScript()) &&
3108	FormatTok->is(II: Keywords.kw_finally)))) {
3109	break;
3110	}
3111	if (FormatTok->is(Kind: tok::kw_catch))
3112	SeenCatch = true;
3113	nextToken();
3114	while (FormatTok->isNot(Kind: tok::l_brace)) {
3115	if (FormatTok->is(Kind: tok::l_paren)) {
3116	parseParens();
3117	continue;
3118	}
3119	if (FormatTok->isOneOf(K1: tok::semi, K2: tok::r_brace) \|\| eof()) {
3120	if (Style.RemoveBracesLLVM)
3121	NestedTooDeep.pop_back();
3122	return;
3123	}
3124	nextToken();
3125	}
3126	if (SeenCatch) {
3127	FormatTok->setFinalizedType(TT_ControlStatementLBrace);
3128	SeenCatch = false;
3129	}
3130	NeedsUnwrappedLine = false;
3131	Line ->MustBeDeclaration = false;
3132	CompoundStatementIndenter Indenter(this, Style, Line ->Level);
3133	parseBlock();
3134	if (Style.BraceWrapping.BeforeCatch)
3135	addUnwrappedLine();
3136	else
3137	NeedsUnwrappedLine = true;
3138	}
3139
3140	if (Style.RemoveBracesLLVM)
3141	NestedTooDeep.pop_back();
3142
3143	if (NeedsUnwrappedLine)
3144	addUnwrappedLine();
3145	}
3146
3147	void UnwrappedLineParser::parseNamespaceOrExportBlock(unsigned AddLevels) {
3148	bool ManageWhitesmithsBraces =
3149	AddLevels == `0u` && Style.BreakBeforeBraces == FormatStyle::BS_Whitesmiths;
3150
3151	// If we're in Whitesmiths mode, indent the brace if we're not indenting
3152	// the whole block.
3153	if (ManageWhitesmithsBraces)
3154	++Line ->Level;
3155
3156	// Munch the semicolon after the block. This is more common than one would
3157	// think. Putting the semicolon into its own line is very ugly.
3158	parseBlock(/MustBeDeclaration=/true, AddLevels, /MunchSemi=/true,
3159	/KeepBraces=/true, /IfKind=/nullptr, UnindentWhitesmithsBraces: ManageWhitesmithsBraces);
3160
3161	addUnwrappedLine(AdjustLevel: AddLevels > `0` ? LineLevel::Remove : LineLevel::Keep);
3162
3163	if (ManageWhitesmithsBraces)
3164	--Line ->Level;
3165	}
3166
3167	void UnwrappedLineParser::parseNamespace() {
3168	assert(FormatTok->isOneOf(tok::kw_namespace, TT_NamespaceMacro) &&
3169	"'namespace' expected");
3170
3171	const FormatToken &InitialToken = *FormatTok;
3172	nextToken();
3173	if (InitialToken.is(TT: TT_NamespaceMacro)) {
3174	parseParens();
3175	} else {
3176	while (FormatTok->isOneOf(K1: tok::identifier, K2: tok::coloncolon, Ks: tok::kw_inline,
3177	Ks: tok::l_square, Ks: tok::period, Ks: tok::l_paren) \|\|
3178	(Style.isCSharp() && FormatTok->is(Kind: tok::kw_union))) {
3179	if (FormatTok->is(Kind: tok::l_square))
3180	parseSquare();
3181	else if (FormatTok->is(Kind: tok::l_paren))
3182	parseParens();
3183	else
3184	nextToken();
3185	}
3186	}
3187	if (FormatTok->is(Kind: tok::l_brace)) {
3188	FormatTok->setFinalizedType(TT_NamespaceLBrace);
3189
3190	if (ShouldBreakBeforeBrace(Style, InitialToken))
3191	addUnwrappedLine();
3192
3193	unsigned AddLevels =
3194	Style.NamespaceIndentation == FormatStyle::NI_All \|\|
3195	(Style.NamespaceIndentation == FormatStyle::NI_Inner &&
3196	DeclarationScopeStack.size() > `1`)
3197	? `1u`
3198	: `0u`;
3199	parseNamespaceOrExportBlock(AddLevels);
3200	}
3201	// FIXME: Add error handling.
3202	}
3203
3204	void UnwrappedLineParser::parseCppExportBlock() {
3205	parseNamespaceOrExportBlock(/AddLevels=/Style.IndentExportBlock ? `1` : `0`);
3206	}
3207
3208	void UnwrappedLineParser::parseNew() {
3209	assert(FormatTok->is(tok::kw_new) && "'new' expected");
3210	nextToken();
3211
3212	if (Style.isCSharp()) {
3213	do {
3214	// Handle constructor invocation, e.g. `new(field: value)`.
3215	if (FormatTok->is(Kind: tok::l_paren))
3216	parseParens();
3217
3218	// Handle array initialization syntax, e.g. `new[] {10, 20, 30}`.
3219	if (FormatTok->is(Kind: tok::l_brace))
3220	parseBracedList();
3221
3222	if (FormatTok->isOneOf(K1: tok::semi, K2: tok::comma))
3223	return;
3224
3225	nextToken();
3226	} while (!eof());
3227	}
3228
3229	if (!Style.isJava())
3230	return;
3231
3232	// In Java, we can parse everything up to the parens, which aren't optional.
3233	do {
3234	// There should not be a ;, { or } before the new's open paren.
3235	if (FormatTok->isOneOf(K1: tok::semi, K2: tok::l_brace, Ks: tok::r_brace))
3236	return;
3237
3238	// Consume the parens.
3239	if (FormatTok->is(Kind: tok::l_paren)) {
3240	parseParens();
3241
3242	// If there is a class body of an anonymous class, consume that as child.
3243	if (FormatTok->is(Kind: tok::l_brace))
3244	parseChildBlock();
3245	return;
3246	}
3247	nextToken();
3248	} while (!eof());
3249	}
3250
3251	void UnwrappedLineParser::parseLoopBody(bool KeepBraces, bool WrapRightBrace) {
3252	keepAncestorBraces();
3253
3254	if (isBlockBegin(Tok: *FormatTok)) {
3255	FormatTok->setFinalizedType(TT_ControlStatementLBrace);
3256	FormatToken *LeftBrace = FormatTok;
3257	CompoundStatementIndenter Indenter(this, Style, Line ->Level);
3258	parseBlock(/MustBeDeclaration=/false, /AddLevels=/`1u`,
3259	/MunchSemi=/true, KeepBraces);
3260	setPreviousRBraceType(TT_ControlStatementRBrace);
3261	if (!KeepBraces) {
3262	assert(!NestedTooDeep.empty());
3263	if (!NestedTooDeep.back())
3264	markOptionalBraces(LeftBrace);
3265	}
3266	if (WrapRightBrace)
3267	addUnwrappedLine();
3268	} else {
3269	parseUnbracedBody();
3270	}
3271
3272	if (!KeepBraces)
3273	NestedTooDeep.pop_back();
3274	}
3275
3276	void UnwrappedLineParser::parseForOrWhileLoop(bool HasParens) {
3277	assert((FormatTok->isOneOf(tok::kw_for, tok::kw_while, TT_ForEachMacro) \|\|
3278	(Style.isVerilog() &&
3279	FormatTok->isOneOf(Keywords.kw_always, Keywords.kw_always_comb,
3280	Keywords.kw_always_ff, Keywords.kw_always_latch,
3281	Keywords.kw_final, Keywords.kw_initial,
3282	Keywords.kw_foreach, Keywords.kw_forever,
3283	Keywords.kw_repeat))) &&
3284	"'for', 'while' or foreach macro expected");
3285	const bool KeepBraces = !Style.RemoveBracesLLVM \|\|
3286	!FormatTok->isOneOf(K1: tok::kw_for, K2: tok::kw_while);
3287
3288	nextToken();
3289	// JS' for await ( ...
3290	if (Style.isJavaScript() && FormatTok->is(II: Keywords.kw_await))
3291	nextToken();
3292	if (IsCpp && FormatTok->is(Kind: tok::kw_co_await))
3293	nextToken();
3294	if (HasParens && FormatTok->is(Kind: tok::l_paren)) {
3295	// The type is only set for Verilog basically because we were afraid to
3296	// change the existing behavior for loops. See the discussion on D121756 for
3297	// details.
3298	if (Style.isVerilog())
3299	FormatTok->setFinalizedType(TT_ConditionLParen);
3300	parseParens();
3301	}
3302
3303	if (Style.isVerilog()) {
3304	// Event control.
3305	parseVerilogSensitivityList();
3306	} else if (Style.AllowShortLoopsOnASingleLine && FormatTok->is(Kind: tok::semi) &&
3307	Tokens->getPreviousToken()->is(Kind: tok::r_paren)) {
3308	nextToken();
3309	addUnwrappedLine();
3310	return;
3311	}
3312
3313	handleAttributes();
3314	parseLoopBody(KeepBraces, /WrapRightBrace=/true);
3315	}
3316
3317	void UnwrappedLineParser::parseDoWhile() {
3318	assert(FormatTok->is(tok::kw_do) && "'do' expected");
3319	nextToken();
3320
3321	parseLoopBody(/KeepBraces=/true, WrapRightBrace: Style.BraceWrapping.BeforeWhile);
3322
3323	// FIXME: Add error handling.
3324	if (FormatTok->isNot(Kind: tok::kw_while)) {
3325	addUnwrappedLine();
3326	return;
3327	}
3328
3329	FormatTok->setFinalizedType(TT_DoWhile);
3330
3331	// If in Whitesmiths mode, the line with the while() needs to be indented
3332	// to the same level as the block.
3333	if (Style.BreakBeforeBraces == FormatStyle::BS_Whitesmiths)
3334	++Line ->Level;
3335
3336	nextToken();
3337	parseStructuralElement();
3338	}
3339
3340	void UnwrappedLineParser::parseLabel(bool LeftAlignLabel) {
3341	nextToken();
3342	unsigned OldLineLevel = Line ->Level;
3343
3344	if (LeftAlignLabel)
3345	Line ->Level = `0`;
3346	else if (Line ->Level > `1` \|\| (!Line ->InPPDirective && Line ->Level > `0`))
3347	--Line ->Level;
3348
3349	if (!Style.IndentCaseBlocks && CommentsBeforeNextToken.empty() &&
3350	FormatTok->is(Kind: tok::l_brace)) {
3351
3352	CompoundStatementIndenter Indenter(this, Line ->Level,
3353	Style.BraceWrapping.AfterCaseLabel,
3354	Style.BraceWrapping.IndentBraces);
3355	parseBlock();
3356	if (FormatTok->is(Kind: tok::kw_break)) {
3357	if (Style.BraceWrapping.AfterControlStatement ==
3358	FormatStyle::BWACS_Always) {
3359	addUnwrappedLine();
3360	if (!Style.IndentCaseBlocks &&
3361	Style.BreakBeforeBraces == FormatStyle::BS_Whitesmiths) {
3362	++Line ->Level;
3363	}
3364	}
3365	parseStructuralElement();
3366	}
3367	addUnwrappedLine();
3368	} else {
3369	if (FormatTok->is(Kind: tok::semi))
3370	nextToken();
3371	addUnwrappedLine();
3372	}
3373	Line ->Level = OldLineLevel;
3374	if (FormatTok->isNot(Kind: tok::l_brace)) {
3375	parseStructuralElement();
3376	addUnwrappedLine();
3377	}
3378	}
3379
3380	void UnwrappedLineParser::parseCaseLabel() {
3381	assert(FormatTok->is(tok::kw_case) && "'case' expected");
3382	auto *Case = FormatTok;
3383
3384	// FIXME: fix handling of complex expressions here.
3385	do {
3386	nextToken();
3387	if (FormatTok->is(Kind: tok::colon)) {
3388	FormatTok->setFinalizedType(TT_CaseLabelColon);
3389	break;
3390	}
3391	if (Style.isJava() && FormatTok->is(Kind: tok::arrow)) {
3392	FormatTok->setFinalizedType(TT_CaseLabelArrow);
3393	Case->setFinalizedType(TT_SwitchExpressionLabel);
3394	break;
3395	}
3396	} while (!eof());
3397	parseLabel();
3398	}
3399
3400	void UnwrappedLineParser::parseSwitch(bool IsExpr) {
3401	assert(FormatTok->is(tok::kw_switch) && "'switch' expected");
3402	nextToken();
3403	if (FormatTok->is(Kind: tok::l_paren))
3404	parseParens();
3405
3406	keepAncestorBraces();
3407
3408	if (FormatTok->is(Kind: tok::l_brace)) {
3409	CompoundStatementIndenter Indenter(this, Style, Line ->Level);
3410	FormatTok->setFinalizedType(IsExpr ? TT_SwitchExpressionLBrace
3411	: TT_ControlStatementLBrace);
3412	if (IsExpr)
3413	parseChildBlock();
3414	else
3415	parseBlock();
3416	setPreviousRBraceType(TT_ControlStatementRBrace);
3417	if (!IsExpr)
3418	addUnwrappedLine();
3419	} else {
3420	addUnwrappedLine();
3421	++Line ->Level;
3422	parseStructuralElement();
3423	--Line ->Level;
3424	}
3425
3426	if (Style.RemoveBracesLLVM)
3427	NestedTooDeep.pop_back();
3428	}
3429
3430	void UnwrappedLineParser::parseAccessSpecifier() {
3431	nextToken();
3432	// Understand Qt's slots.
3433	if (FormatTok->isOneOf(K1: Keywords.kw_slots, K2: Keywords.kw_qslots))
3434	nextToken();
3435	// Otherwise, we don't know what it is, and we'd better keep the next token.
3436	if (FormatTok->is(Kind: tok::colon))
3437	nextToken();
3438	addUnwrappedLine();
3439	}
3440
3441	/// Parses a requires, decides if it is a clause or an expression.
3442	/// \pre The current token has to be the requires keyword.
3443	/// \returns true if it parsed a clause.
3444	bool UnwrappedLineParser::parseRequires(bool SeenEqual) {
3445	assert(FormatTok->is(tok::kw_requires) && "'requires' expected");
3446	auto RequiresToken = FormatTok;
3447
3448	// We try to guess if it is a requires clause, or a requires expression. For
3449	// that we first consume the keyword and check the next token.
3450	nextToken();
3451
3452	switch (FormatTok->Tok.getKind()) {
3453	case tok::l_brace:
3454	// This can only be an expression, never a clause.
3455	parseRequiresExpression(RequiresToken);
3456	return false;
3457	case tok::l_paren:
3458	// Clauses and expression can start with a paren, it's unclear what we have.
3459	break;
3460	default:
3461	// All other tokens can only be a clause.
3462	parseRequiresClause(RequiresToken);
3463	return true;
3464	}
3465
3466	// Looking forward we would have to decide if there are function declaration
3467	// like arguments to the requires expression:
3468	// requires (T t) {
3469	// Or there is a constraint expression for the requires clause:
3470	// requires (C<T> && ...
3471
3472	// But first let's look behind.
3473	auto *PreviousNonComment = RequiresToken->getPreviousNonComment();
3474
3475	if (!PreviousNonComment \|\|
3476	PreviousNonComment->is(TT: TT_RequiresExpressionLBrace)) {
3477	// If there is no token, or an expression left brace, we are a requires
3478	// clause within a requires expression.
3479	parseRequiresClause(RequiresToken);
3480	return true;
3481	}
3482
3483	switch (PreviousNonComment->Tok.getKind()) {
3484	case tok::greater:
3485	case tok::r_paren:
3486	case tok::kw_noexcept:
3487	case tok::kw_const:
3488	case tok::star:
3489	case tok::amp:
3490	// This is a requires clause.
3491	parseRequiresClause(RequiresToken);
3492	return true;
3493	case tok::ampamp: {
3494	// This can be either:
3495	// if (... && requires (T t) ...)
3496	// Or
3497	// void member(...) && requires (C<T> ...
3498	// We check the one token before that for a const:
3499	// void member(...) const && requires (C<T> ...
3500	auto PrevPrev = PreviousNonComment->getPreviousNonComment();
3501	if ((PrevPrev && PrevPrev->is(Kind: tok::kw_const)) \|\| !SeenEqual) {
3502	parseRequiresClause(RequiresToken);
3503	return true;
3504	}
3505	break;
3506	}
3507	default:
3508	if (PreviousNonComment->isTypeOrIdentifier(LangOpts)) {
3509	// This is a requires clause.
3510	parseRequiresClause(RequiresToken);
3511	return true;
3512	}
3513	// It's an expression.
3514	parseRequiresExpression(RequiresToken);
3515	return false;
3516	}
3517
3518	// Now we look forward and try to check if the paren content is a parameter
3519	// list. The parameters can be cv-qualified and contain references or
3520	// pointers.
3521	// So we want basically to check for TYPE NAME, but TYPE can contain all kinds
3522	// of stuff: typename, const, , &, &&, ::, identifiers.*
3523
3524	unsigned StoredPosition = Tokens->getPosition();
3525	FormatToken *NextToken = Tokens->getNextToken();
3526	int Lookahead = `0`;
3527	auto PeekNext = [&Lookahead, &NextToken, this] {
3528	++Lookahead;
3529	NextToken = Tokens->getNextToken();
3530	};
3531
3532	bool FoundType = false;
3533	bool LastWasColonColon = false;
3534	int OpenAngles = `0`;
3535
3536	for (; Lookahead < `50`; PeekNext ()) {
3537	switch (NextToken->Tok.getKind()) {
3538	case tok::kw_volatile:
3539	case tok::kw_const:
3540	case tok::comma:
3541	if (OpenAngles == `0`) {
3542	FormatTok = Tokens->setPosition(StoredPosition);
3543	parseRequiresExpression(RequiresToken);
3544	return false;
3545	}
3546	break;
3547	case tok::eof:
3548	// Break out of the loop.
3549	Lookahead = `50`;
3550	break;
3551	case tok::coloncolon:
3552	LastWasColonColon = true;
3553	break;
3554	case tok::kw_decltype:
3555	case tok::identifier:
3556	if (FoundType && !LastWasColonColon && OpenAngles == `0`) {
3557	FormatTok = Tokens->setPosition(StoredPosition);
3558	parseRequiresExpression(RequiresToken);
3559	return false;
3560	}
3561	FoundType = true;
3562	LastWasColonColon = false;
3563	break;
3564	case tok::less:
3565	++OpenAngles;
3566	break;
3567	case tok::greater:
3568	--OpenAngles;
3569	break;
3570	default:
3571	if (NextToken->isTypeName(LangOpts)) {
3572	FormatTok = Tokens->setPosition(StoredPosition);
3573	parseRequiresExpression(RequiresToken);
3574	return false;
3575	}
3576	break;
3577	}
3578	}
3579	// This seems to be a complicated expression, just assume it's a clause.
3580	FormatTok = Tokens->setPosition(StoredPosition);
3581	parseRequiresClause(RequiresToken);
3582	return true;
3583	}
3584
3585	/// Parses a requires clause.
3586	/// \param RequiresToken The requires keyword token, which starts this clause.
3587	/// \pre We need to be on the next token after the requires keyword.
3588	/// \sa parseRequiresExpression
3589	///
3590	/// Returns if it either has finished parsing the clause, or it detects, that
3591	/// the clause is incorrect.
3592	void UnwrappedLineParser::parseRequiresClause(FormatToken *RequiresToken) {
3593	assert(FormatTok->getPreviousNonComment() == RequiresToken);
3594	assert(RequiresToken->is(tok::kw_requires) && "'requires' expected");
3595
3596	// If there is no previous token, we are within a requires expression,
3597	// otherwise we will always have the template or function declaration in front
3598	// of it.
3599	bool InRequiresExpression =
3600	!RequiresToken->Previous \|\|
3601	RequiresToken->Previous->is(TT: TT_RequiresExpressionLBrace);
3602
3603	RequiresToken->setFinalizedType(InRequiresExpression
3604	? TT_RequiresClauseInARequiresExpression
3605	: TT_RequiresClause);
3606
3607	// NOTE: parseConstraintExpression is only ever called from this function.
3608	// It could be inlined into here.
3609	parseConstraintExpression();
3610
3611	if (!InRequiresExpression && FormatTok->Previous)
3612	FormatTok->Previous->ClosesRequiresClause = true;
3613	}
3614
3615	/// Parses a requires expression.
3616	/// \param RequiresToken The requires keyword token, which starts this clause.
3617	/// \pre We need to be on the next token after the requires keyword.
3618	/// \sa parseRequiresClause
3619	///
3620	/// Returns if it either has finished parsing the expression, or it detects,
3621	/// that the expression is incorrect.
3622	void UnwrappedLineParser::parseRequiresExpression(FormatToken *RequiresToken) {
3623	assert(FormatTok->getPreviousNonComment() == RequiresToken);
3624	assert(RequiresToken->is(tok::kw_requires) && "'requires' expected");
3625
3626	RequiresToken->setFinalizedType(TT_RequiresExpression);
3627
3628	if (FormatTok->is(Kind: tok::l_paren)) {
3629	FormatTok->setFinalizedType(TT_RequiresExpressionLParen);
3630	parseParens();
3631	}
3632
3633	if (FormatTok->is(Kind: tok::l_brace)) {
3634	FormatTok->setFinalizedType(TT_RequiresExpressionLBrace);
3635	parseChildBlock();
3636	}
3637	}
3638
3639	/// Parses a constraint expression.
3640	///
3641	/// This is the body of a requires clause. It returns, when the parsing is
3642	/// complete, or the expression is incorrect.
3643	void UnwrappedLineParser::parseConstraintExpression() {
3644	// The special handling for lambdas is needed since tryToParseLambda() eats a
3645	// token and if a requires expression is the last part of a requires clause
3646	// and followed by an attribute like [[nodiscard]] the ClosesRequiresClause is
3647	// not set on the correct token. Thus we need to be aware if we even expect a
3648	// lambda to be possible.
3649	// template <typename T> requires requires { ... } [[nodiscard]] ...;
3650	bool LambdaNextTimeAllowed = true;
3651
3652	// Within lambda declarations, it is permitted to put a requires clause after
3653	// its template parameter list, which would place the requires clause right
3654	// before the parentheses of the parameters of the lambda declaration. Thus,
3655	// we track if we expect to see grouping parentheses at all.
3656	// Without this check, `requires foo<T> (T t)` in the below example would be
3657	// seen as the whole requires clause, accidentally eating the parameters of
3658	// the lambda.
3659	// [&]<typename T> requires foo<T> (T t) { ... };
3660	bool TopLevelParensAllowed = true;
3661
3662	do {
3663	bool LambdaThisTimeAllowed = std::exchange(obj&: LambdaNextTimeAllowed, new_val: false);
3664
3665	switch (FormatTok->Tok.getKind()) {
3666	case tok::kw_requires: {
3667	auto RequiresToken = FormatTok;
3668	nextToken();
3669	parseRequiresExpression(RequiresToken);
3670	break;
3671	}
3672
3673	case tok::l_paren:
3674	if (!TopLevelParensAllowed)
3675	return;
3676	parseParens(/AmpAmpTokenType=/TT_BinaryOperator);
3677	TopLevelParensAllowed = false;
3678	break;
3679
3680	case tok::l_square:
3681	if (!LambdaThisTimeAllowed \|\| !tryToParseLambda())
3682	return;
3683	break;
3684
3685	case tok::kw_const:
3686	case tok::semi:
3687	case tok::kw_class:
3688	case tok::kw_struct:
3689	case tok::kw_union:
3690	return;
3691
3692	case tok::l_brace:
3693	// Potential function body.
3694	return;
3695
3696	case tok::ampamp:
3697	case tok::pipepipe:
3698	FormatTok->setFinalizedType(TT_BinaryOperator);
3699	nextToken();
3700	LambdaNextTimeAllowed = true;
3701	TopLevelParensAllowed = true;
3702	break;
3703
3704	case tok::comma:
3705	case tok::comment:
3706	LambdaNextTimeAllowed = LambdaThisTimeAllowed;
3707	nextToken();
3708	break;
3709
3710	case tok::kw_sizeof:
3711	case tok::greater:
3712	case tok::greaterequal:
3713	case tok::greatergreater:
3714	case tok::less:
3715	case tok::lessequal:
3716	case tok::lessless:
3717	case tok::equalequal:
3718	case tok::exclaim:
3719	case tok::exclaimequal:
3720	case tok::plus:
3721	case tok::minus:
3722	case tok::star:
3723	case tok::slash:
3724	LambdaNextTimeAllowed = true;
3725	TopLevelParensAllowed = true;
3726	// Just eat them.
3727	nextToken();
3728	break;
3729
3730	case tok::numeric_constant:
3731	case tok::coloncolon:
3732	case tok::kw_true:
3733	case tok::kw_false:
3734	TopLevelParensAllowed = false;
3735	// Just eat them.
3736	nextToken();
3737	break;
3738
3739	case tok::kw_static_cast:
3740	case tok::kw_const_cast:
3741	case tok::kw_reinterpret_cast:
3742	case tok::kw_dynamic_cast:
3743	nextToken();
3744	if (FormatTok->isNot(Kind: tok::less))
3745	return;
3746
3747	nextToken();
3748	parseBracedList(/IsAngleBracket=/true);
3749	break;
3750
3751	default:
3752	if (!FormatTok->Tok.getIdentifierInfo()) {
3753	// Identifiers are part of the default case, we check for more then
3754	// tok::identifier to handle builtin type traits.
3755	return;
3756	}
3757
3758	// We need to differentiate identifiers for a template deduction guide,
3759	// variables, or function return types (the constraint expression has
3760	// ended before that), and basically all other cases. But it's easier to
3761	// check the other way around.
3762	assert(FormatTok->Previous);
3763	switch (FormatTok->Previous->Tok.getKind()) {
3764	case tok::coloncolon: // Nested identifier.
3765	case tok::ampamp: // Start of a function or variable for the
3766	case tok::pipepipe: // constraint expression. (binary)
3767	case tok::exclaim: // The same as above, but unary.
3768	case tok::kw_requires: // Initial identifier of a requires clause.
3769	case tok::equal: // Initial identifier of a concept declaration.
3770	break;
3771	default:
3772	return;
3773	}
3774
3775	// Read identifier with optional template declaration.
3776	nextToken();
3777	if (FormatTok->is(Kind: tok::less)) {
3778	nextToken();
3779	parseBracedList(/IsAngleBracket=/true);
3780	}
3781	TopLevelParensAllowed = false;
3782	break;
3783	}
3784	} while (!eof());
3785	}
3786
3787	bool UnwrappedLineParser::parseEnum() {
3788	const FormatToken &InitialToken = *FormatTok;
3789
3790	// Won't be 'enum' for NS_ENUMs.
3791	if (FormatTok->is(Kind: tok::kw_enum))
3792	nextToken();
3793
3794	// In TypeScript, "enum" can also be used as property name, e.g. in interface
3795	// declarations. An "enum" keyword followed by a colon would be a syntax
3796	// error and thus assume it is just an identifier.
3797	if (Style.isJavaScript() && FormatTok->isOneOf(K1: tok::colon, K2: tok::question))
3798	return false;
3799
3800	// In protobuf, "enum" can be used as a field name.
3801	if (Style.Language == FormatStyle::LK_Proto && FormatTok->is(Kind: tok::equal))
3802	return false;
3803
3804	if (IsCpp) {
3805	// Eat up enum class ...
3806	if (FormatTok->isOneOf(K1: tok::kw_class, K2: tok::kw_struct))
3807	nextToken();
3808	while (FormatTok->is(Kind: tok::l_square))
3809	if (!handleCppAttributes())
3810	return false;
3811	}
3812
3813	while (FormatTok->Tok.getIdentifierInfo() \|\|
3814	FormatTok->isOneOf(K1: tok::colon, K2: tok::coloncolon, Ks: tok::less,
3815	Ks: tok::greater, Ks: tok::comma, Ks: tok::question,
3816	Ks: tok::l_square)) {
3817	if (Style.isVerilog()) {
3818	FormatTok->setFinalizedType(TT_VerilogDimensionedTypeName);
3819	nextToken();
3820	// In Verilog the base type can have dimensions.
3821	while (FormatTok->is(Kind: tok::l_square))
3822	parseSquare();
3823	} else {
3824	nextToken();
3825	}
3826	// We can have macros or attributes in between 'enum' and the enum name.
3827	if (FormatTok->is(Kind: tok::l_paren))
3828	parseParens();
3829	if (FormatTok->is(Kind: tok::identifier)) {
3830	nextToken();
3831	// If there are two identifiers in a row, this is likely an elaborate
3832	// return type. In Java, this can be "implements", etc.
3833	if (IsCpp && FormatTok->is(Kind: tok::identifier))
3834	return false;
3835	}
3836	}
3837
3838	// Just a declaration or something is wrong.
3839	if (FormatTok->isNot(Kind: tok::l_brace))
3840	return true;
3841	FormatTok->setFinalizedType(TT_EnumLBrace);
3842	FormatTok->setBlockKind(BK_Block);
3843
3844	if (Style.isJava()) {
3845	// Java enums are different.
3846	parseJavaEnumBody();
3847	return true;
3848	}
3849	if (Style.Language == FormatStyle::LK_Proto) {
3850	parseBlock(/MustBeDeclaration=/true);
3851	return true;
3852	}
3853
3854	if (!Style.AllowShortEnumsOnASingleLine &&
3855	ShouldBreakBeforeBrace(Style, InitialToken)) {
3856	addUnwrappedLine();
3857	}
3858	// Parse enum body.
3859	nextToken();
3860	if (!Style.AllowShortEnumsOnASingleLine) {
3861	addUnwrappedLine();
3862	Line ->Level += `1`;
3863	}
3864	bool HasError = !parseBracedList(/IsAngleBracket=/false, /IsEnum=/true);
3865	if (!Style.AllowShortEnumsOnASingleLine)
3866	Line ->Level -= `1`;
3867	if (HasError) {
3868	if (FormatTok->is(Kind: tok::semi))
3869	nextToken();
3870	addUnwrappedLine();
3871	}
3872	setPreviousRBraceType(TT_EnumRBrace);
3873	return true;
3874
3875	// There is no addUnwrappedLine() here so that we fall through to parsing a
3876	// structural element afterwards. Thus, in "enum A {} n, m;",
3877	// "} n, m;" will end up in one unwrapped line.
3878	}
3879
3880	bool UnwrappedLineParser::parseStructLike() {
3881	// parseRecord falls through and does not yet add an unwrapped line as a
3882	// record declaration or definition can start a structural element.
3883	parseRecord();
3884	// This does not apply to Java, JavaScript and C#.
3885	if (Style.isJava() \|\| Style.isJavaScript() \|\| Style.isCSharp()) {
3886	if (FormatTok->is(Kind: tok::semi))
3887	nextToken();
3888	addUnwrappedLine();
3889	return true;
3890	}
3891	return false;
3892	}
3893
3894	namespace {
3895	// A class used to set and restore the Token position when peeking
3896	// ahead in the token source.
3897	class ScopedTokenPosition {
3898	unsigned StoredPosition;
3899	FormatTokenSource *Tokens;
3900
3901	public:
3902	ScopedTokenPosition(FormatTokenSource *Tokens) : Tokens(Tokens) {
3903	assert(Tokens && "Tokens expected to not be null");
3904	StoredPosition = Tokens->getPosition();
3905	}
3906
3907	~ScopedTokenPosition() { Tokens->setPosition(StoredPosition); }
3908	};
3909	} // namespace
3910
3911	// Look to see if we have [[ by looking ahead, if
3912	// its not then rewind to the original position.
3913	bool UnwrappedLineParser::tryToParseSimpleAttribute() {
3914	ScopedTokenPosition AutoPosition(Tokens);
3915	FormatToken *Tok = Tokens->getNextToken();
3916	// We already read the first [ check for the second.
3917	if (Tok->isNot(Kind: tok::l_square))
3918	return false;
3919	// Double check that the attribute is just something
3920	// fairly simple.
3921	while (Tok->isNot(Kind: tok::eof)) {
3922	if (Tok->is(Kind: tok::r_square))
3923	break;
3924	Tok = Tokens->getNextToken();
3925	}
3926	if (Tok->is(Kind: tok::eof))
3927	return false;
3928	Tok = Tokens->getNextToken();
3929	if (Tok->isNot(Kind: tok::r_square))
3930	return false;
3931	Tok = Tokens->getNextToken();
3932	if (Tok->is(Kind: tok::semi))
3933	return false;
3934	return true;
3935	}
3936
3937	void UnwrappedLineParser::parseJavaEnumBody() {
3938	assert(FormatTok->is(tok::l_brace));
3939	const FormatToken *OpeningBrace = FormatTok;
3940
3941	// Determine whether the enum is simple, i.e. does not have a semicolon or
3942	// constants with class bodies. Simple enums can be formatted like braced
3943	// lists, contracted to a single line, etc.
3944	unsigned StoredPosition = Tokens->getPosition();
3945	bool IsSimple = true;
3946	FormatToken *Tok = Tokens->getNextToken();
3947	while (Tok->isNot(Kind: tok::eof)) {
3948	if (Tok->is(Kind: tok::r_brace))
3949	break;
3950	if (Tok->isOneOf(K1: tok::l_brace, K2: tok::semi)) {
3951	IsSimple = false;
3952	break;
3953	}
3954	// FIXME: This will also mark enums with braces in the arguments to enum
3955	// constants as "not simple". This is probably fine in practice, though.
3956	Tok = Tokens->getNextToken();
3957	}
3958	FormatTok = Tokens->setPosition(StoredPosition);
3959
3960	if (IsSimple) {
3961	nextToken();
3962	parseBracedList();
3963	addUnwrappedLine();
3964	return;
3965	}
3966
3967	// Parse the body of a more complex enum.
3968	// First add a line for everything up to the "{".
3969	nextToken();
3970	addUnwrappedLine();
3971	++Line ->Level;
3972
3973	// Parse the enum constants.
3974	while (!eof()) {
3975	if (FormatTok->is(Kind: tok::l_brace)) {
3976	// Parse the constant's class body.
3977	parseBlock(/MustBeDeclaration=/true, /AddLevels=/`1u`,
3978	/MunchSemi=/false);
3979	} else if (FormatTok->is(Kind: tok::l_paren)) {
3980	parseParens();
3981	} else if (FormatTok->is(Kind: tok::comma)) {
3982	nextToken();
3983	addUnwrappedLine();
3984	} else if (FormatTok->is(Kind: tok::semi)) {
3985	nextToken();
3986	addUnwrappedLine();
3987	break;
3988	} else if (FormatTok->is(Kind: tok::r_brace)) {
3989	addUnwrappedLine();
3990	break;
3991	} else {
3992	nextToken();
3993	}
3994	}
3995
3996	// Parse the class body after the enum's ";" if any.
3997	parseLevel(OpeningBrace);
3998	nextToken();
3999	--Line ->Level;
4000	addUnwrappedLine();
4001	}
4002
4003	void UnwrappedLineParser::parseRecord(bool ParseAsExpr, bool IsJavaRecord) {
4004	assert(!IsJavaRecord \|\| FormatTok->is(Keywords.kw_record));
4005	const FormatToken &InitialToken = *FormatTok;
4006	nextToken();
4007
4008	FormatToken *ClassName =
4009	IsJavaRecord && FormatTok->is(Kind: tok::identifier) ? FormatTok : nullptr;
4010	bool IsDerived = false;
4011	auto IsNonMacroIdentifier = [](const FormatToken *Tok) {
4012	return Tok->is(Kind: tok::identifier) && Tok->TokenText != Tok->TokenText.upper();
4013	};
4014	// JavaScript/TypeScript supports anonymous classes like:
4015	// a = class extends foo { }
4016	bool JSPastExtendsOrImplements = false;
4017	// The actual identifier can be a nested name specifier, and in macros
4018	// it is often token-pasted.
4019	// An [[attribute]] can be before the identifier.
4020	while (FormatTok->isOneOf(K1: tok::identifier, K2: tok::coloncolon, Ks: tok::hashhash,
4021	Ks: tok::kw_alignas, Ks: tok::l_square) \|\|
4022	FormatTok->isAttribute() \|\|
4023	((Style.isJava() \|\| Style.isJavaScript()) &&
4024	FormatTok->isOneOf(K1: tok::period, K2: tok::comma))) {
4025	if (Style.isJavaScript() &&
4026	FormatTok->isOneOf(K1: Keywords.kw_extends, K2: Keywords.kw_implements)) {
4027	JSPastExtendsOrImplements = true;
4028	// JavaScript/TypeScript supports inline object types in
4029	// extends/implements positions:
4030	// class Foo implements {bar: number} { }
4031	nextToken();
4032	if (FormatTok->is(Kind: tok::l_brace)) {
4033	tryToParseBracedList();
4034	continue;
4035	}
4036	}
4037	if (FormatTok->is(Kind: tok::l_square) && handleCppAttributes())
4038	continue;
4039	auto *Previous = FormatTok;
4040	nextToken();
4041	switch (FormatTok->Tok.getKind()) {
4042	case tok::l_paren:
4043	// We can have macros in between 'class' and the class name.
4044	if (IsJavaRecord \|\| !IsNonMacroIdentifier (Previous) \|\|
4045	// e.g. `struct macro(a) S { int i; };`
4046	Previous->Previous == &InitialToken) {
4047	parseParens();
4048	}
4049	break;
4050	case tok::coloncolon:
4051	case tok::hashhash:
4052	break;
4053	default:
4054	if (JSPastExtendsOrImplements \|\| ClassName \|\|
4055	Previous->isNot(Kind: tok::identifier) \|\| Previous->is(TT: TT_AttributeMacro)) {
4056	break;
4057	}
4058	if (const auto Text = Previous->TokenText;
4059	Text.size() == `1` \|\| Text != Text.upper()) {
4060	ClassName = Previous;
4061	}
4062	}
4063	}
4064
4065	auto IsListInitialization = [&] {
4066	if (!ClassName \|\| IsDerived \|\| JSPastExtendsOrImplements)
4067	return false;
4068	assert(FormatTok->is(tok::l_brace));
4069	const auto *Prev = FormatTok->getPreviousNonComment();
4070	assert(Prev);
4071	return Prev != ClassName && Prev->is(Kind: tok::identifier) &&
4072	Prev->isNot(Kind: Keywords.kw_final) && tryToParseBracedList();
4073	};
4074
4075	if (FormatTok->isOneOf(K1: tok::colon, K2: tok::less)) {
4076	int AngleNestingLevel = `0`;
4077	do {
4078	if (FormatTok->is(Kind: tok::less))
4079	++AngleNestingLevel;
4080	else if (FormatTok->is(Kind: tok::greater))
4081	--AngleNestingLevel;
4082
4083	if (AngleNestingLevel == `0`) {
4084	if (FormatTok->is(Kind: tok::colon)) {
4085	IsDerived = true;
4086	} else if (!IsDerived && FormatTok->is(Kind: tok::identifier) &&
4087	FormatTok->Previous->is(Kind: tok::coloncolon)) {
4088	ClassName = FormatTok;
4089	} else if (FormatTok->is(Kind: tok::l_paren) &&
4090	IsNonMacroIdentifier (FormatTok->Previous)) {
4091	break;
4092	}
4093	}
4094	if (FormatTok->is(Kind: tok::l_brace)) {
4095	if (AngleNestingLevel == `0` && IsListInitialization ())
4096	return;
4097	calculateBraceTypes(/ExpectClassBody=/true);
4098	if (!tryToParseBracedList())
4099	break;
4100	}
4101	if (FormatTok->is(Kind: tok::l_square)) {
4102	FormatToken *Previous = FormatTok->Previous;
4103	if (!Previous \|\| (Previous->isNot(Kind: tok::r_paren) &&
4104	!Previous->isTypeOrIdentifier(LangOpts))) {
4105	// Don't try parsing a lambda if we had a closing parenthesis before,
4106	// it was probably a pointer to an array: int ()[].*
4107	if (!tryToParseLambda())
4108	continue;
4109	} else {
4110	parseSquare();
4111	continue;
4112	}
4113	}
4114	if (FormatTok->is(Kind: tok::semi))
4115	return;
4116	if (Style.isCSharp() && FormatTok->is(II: Keywords.kw_where)) {
4117	addUnwrappedLine();
4118	nextToken();
4119	parseCSharpGenericTypeConstraint();
4120	break;
4121	}
4122	nextToken();
4123	} while (!eof());
4124	}
4125
4126	auto GetBraceTypes =
4127	[](const FormatToken &RecordTok) -> std::pair<TokenType, TokenType> {
4128	switch (RecordTok.Tok.getKind()) {
4129	case tok::kw_class:
4130	return {TT_ClassLBrace, TT_ClassRBrace};
4131	case tok::kw_struct:
4132	return {TT_StructLBrace, TT_StructRBrace};
4133	case tok::kw_union:
4134	return {TT_UnionLBrace, TT_UnionRBrace};
4135	default:
4136	// Useful for e.g. interface.
4137	return {TT_RecordLBrace, TT_RecordRBrace};
4138	}
4139	};
4140	if (FormatTok->is(Kind: tok::l_brace)) {
4141	if (IsListInitialization ())
4142	return;
4143	if (ClassName)
4144	ClassName->setFinalizedType(TT_ClassHeadName);
4145	auto [OpenBraceType, ClosingBraceType] = GetBraceTypes (InitialToken);
4146	FormatTok->setFinalizedType(OpenBraceType);
4147	if (ParseAsExpr) {
4148	parseChildBlock();
4149	} else {
4150	if (ShouldBreakBeforeBrace(Style, InitialToken))
4151	addUnwrappedLine();
4152
4153	unsigned AddLevels = Style.IndentAccessModifiers ? `2u` : `1u`;
4154	parseBlock(/MustBeDeclaration=/true, AddLevels, /MunchSemi=/false);
4155	}
4156	setPreviousRBraceType(ClosingBraceType);
4157	}
4158	// There is no addUnwrappedLine() here so that we fall through to parsing a
4159	// structural element afterwards. Thus, in "class A {} n, m;",
4160	// "} n, m;" will end up in one unwrapped line.
4161	}
4162
4163	void UnwrappedLineParser::parseObjCMethod() {
4164	assert(FormatTok->isOneOf(tok::l_paren, tok::identifier) &&
4165	"'(' or identifier expected.");
4166	do {
4167	if (FormatTok->is(Kind: tok::semi)) {
4168	nextToken();
4169	addUnwrappedLine();
4170	return;
4171	} else if (FormatTok->is(Kind: tok::l_brace)) {
4172	if (Style.BraceWrapping.AfterFunction)
4173	addUnwrappedLine();
4174	parseBlock();
4175	addUnwrappedLine();
4176	return;
4177	} else {
4178	nextToken();
4179	}
4180	} while (!eof());
4181	}
4182
4183	void UnwrappedLineParser::parseObjCProtocolList() {
4184	assert(FormatTok->is(tok::less) && "'<' expected.");
4185	do {
4186	nextToken();
4187	// Early exit in case someone forgot a close angle.
4188	if (FormatTok->isOneOf(K1: tok::semi, K2: tok::l_brace, Ks: tok::objc_end))
4189	return;
4190	} while (!eof() && FormatTok->isNot(Kind: tok::greater));
4191	nextToken(); // Skip '>'.
4192	}
4193
4194	void UnwrappedLineParser::parseObjCUntilAtEnd() {
4195	do {
4196	if (FormatTok->is(Kind: tok::objc_end)) {
4197	nextToken();
4198	addUnwrappedLine();
4199	break;
4200	}
4201	if (FormatTok->is(Kind: tok::l_brace)) {
4202	parseBlock();
4203	// In ObjC interfaces, nothing should be following the "}".
4204	addUnwrappedLine();
4205	} else if (FormatTok->is(Kind: tok::r_brace)) {
4206	// Ignore stray "}". parseStructuralElement doesn't consume them.
4207	nextToken();
4208	addUnwrappedLine();
4209	} else if (FormatTok->isOneOf(K1: tok::minus, K2: tok::plus)) {
4210	nextToken();
4211	parseObjCMethod();
4212	} else {
4213	parseStructuralElement();
4214	}
4215	} while (!eof());
4216	}
4217
4218	void UnwrappedLineParser::parseObjCInterfaceOrImplementation() {
4219	assert(FormatTok->isOneOf(tok::objc_interface, tok::objc_implementation));
4220	nextToken();
4221	nextToken(); // interface name
4222
4223	// @interface can be followed by a lightweight generic
4224	// specialization list, then either a base class or a category.
4225	if (FormatTok->is(Kind: tok::less))
4226	parseObjCLightweightGenerics();
4227	if (FormatTok->is(Kind: tok::colon)) {
4228	nextToken();
4229	nextToken(); // base class name
4230	// The base class can also have lightweight generics applied to it.
4231	if (FormatTok->is(Kind: tok::less))
4232	parseObjCLightweightGenerics();
4233	} else if (FormatTok->is(Kind: tok::l_paren)) {
4234	// Skip category, if present.
4235	parseParens();
4236	}
4237
4238	if (FormatTok->is(Kind: tok::less))
4239	parseObjCProtocolList();
4240
4241	if (FormatTok->is(Kind: tok::l_brace)) {
4242	if (Style.BraceWrapping.AfterObjCDeclaration)
4243	addUnwrappedLine();
4244	parseBlock(/MustBeDeclaration=/true);
4245	}
4246
4247	// With instance variables, this puts '}' on its own line. Without instance
4248	// variables, this ends the @interface line.
4249	addUnwrappedLine();
4250
4251	parseObjCUntilAtEnd();
4252	}
4253
4254	void UnwrappedLineParser::parseObjCLightweightGenerics() {
4255	assert(FormatTok->is(tok::less));
4256	// Unlike protocol lists, generic parameterizations support
4257	// nested angles:
4258	//
4259	// @interface Foo<ValueType : id <NSCopying, NSSecureCoding>> :
4260	// NSObject <NSCopying, NSSecureCoding>
4261	//
4262	// so we need to count how many open angles we have left.
4263	unsigned NumOpenAngles = `1`;
4264	do {
4265	nextToken();
4266	// Early exit in case someone forgot a close angle.
4267	if (FormatTok->isOneOf(K1: tok::semi, K2: tok::l_brace, Ks: tok::objc_end))
4268	break;
4269	if (FormatTok->is(Kind: tok::less)) {
4270	++NumOpenAngles;
4271	} else if (FormatTok->is(Kind: tok::greater)) {
4272	assert(NumOpenAngles > `0` && "'>' makes NumOpenAngles negative");
4273	--NumOpenAngles;
4274	}
4275	} while (!eof() && NumOpenAngles != `0`);
4276	nextToken(); // Skip '>'.
4277	}
4278
4279	// Returns true for the declaration/definition form of @protocol,
4280	// false for the expression form.
4281	bool UnwrappedLineParser::parseObjCProtocol() {
4282	assert(FormatTok->is(tok::objc_protocol));
4283	nextToken();
4284
4285	if (FormatTok->is(Kind: tok::l_paren)) {
4286	// The expression form of @protocol, e.g. "Protocol p = @protocol(foo);".*
4287	return false;
4288	}
4289
4290	// The definition/declaration form,
4291	// @protocol Foo
4292	// - (int)someMethod;
4293	// @end
4294
4295	nextToken(); // protocol name
4296
4297	if (FormatTok->is(Kind: tok::less))
4298	parseObjCProtocolList();
4299
4300	// Check for protocol declaration.
4301	if (FormatTok->is(Kind: tok::semi)) {
4302	nextToken();
4303	addUnwrappedLine();
4304	return true;
4305	}
4306
4307	addUnwrappedLine();
4308	parseObjCUntilAtEnd();
4309	return true;
4310	}
4311
4312	void UnwrappedLineParser::parseJavaScriptEs6ImportExport() {
4313	bool IsImport = FormatTok->is(II: Keywords.kw_import);
4314	assert(IsImport \|\| FormatTok->is(tok::kw_export));
4315	nextToken();
4316
4317	// Consume the "default" in "export default class/function".
4318	if (FormatTok->is(Kind: tok::kw_default))
4319	nextToken();
4320
4321	// Consume "async function", "function" and "default function", so that these
4322	// get parsed as free-standing JS functions, i.e. do not require a trailing
4323	// semicolon.
4324	if (FormatTok->is(II: Keywords.kw_async))
4325	nextToken();
4326	if (FormatTok->is(II: Keywords.kw_function)) {
4327	nextToken();
4328	return;
4329	}
4330
4331	// For imports, `export `, `export {...}`, consume the rest of the line up*
4332	// to the terminating `;`. For everything else, just return and continue
4333	// parsing the structural element, i.e. the declaration or expression for
4334	// `export default`.
4335	if (!IsImport && !FormatTok->isOneOf(K1: tok::l_brace, K2: tok::star) &&
4336	!FormatTok->isStringLiteral() &&
4337	!(FormatTok->is(II: Keywords.kw_type) &&
4338	Tokens->peekNextToken()->isOneOf(K1: tok::l_brace, K2: tok::star))) {
4339	return;
4340	}
4341
4342	while (!eof()) {
4343	if (FormatTok->is(Kind: tok::semi))
4344	return;
4345	if (Line ->Tokens.empty()) {
4346	// Common issue: Automatic Semicolon Insertion wrapped the line, so the
4347	// import statement should terminate.
4348	return;
4349	}
4350	if (FormatTok->is(Kind: tok::l_brace)) {
4351	FormatTok->setBlockKind(BK_Block);
4352	nextToken();
4353	parseBracedList();
4354	} else {
4355	nextToken();
4356	}
4357	}
4358	}
4359
4360	void UnwrappedLineParser::parseStatementMacro() {
4361	nextToken();
4362	if (FormatTok->is(Kind: tok::l_paren))
4363	parseParens();
4364	if (FormatTok->is(Kind: tok::semi))
4365	nextToken();
4366	addUnwrappedLine();
4367	}
4368
4369	void UnwrappedLineParser::parseVerilogHierarchyIdentifier() {
4370	// consume things like a::`b.c[d:e] or a::*
4371	while (true) {
4372	if (FormatTok->isOneOf(K1: tok::star, K2: tok::period, Ks: tok::periodstar,
4373	Ks: tok::coloncolon, Ks: tok::hash) \|\|
4374	Keywords.isVerilogIdentifier(Tok: *FormatTok)) {
4375	nextToken();
4376	} else if (FormatTok->is(Kind: tok::l_square)) {
4377	parseSquare();
4378	} else {
4379	break;
4380	}
4381	}
4382	}
4383
4384	void UnwrappedLineParser::parseVerilogSensitivityList() {
4385	if (FormatTok->isNot(Kind: tok::at))
4386	return;
4387	nextToken();
4388	// A block event expression has 2 at signs.
4389	if (FormatTok->is(Kind: tok::at))
4390	nextToken();
4391	switch (FormatTok->Tok.getKind()) {
4392	case tok::star:
4393	nextToken();
4394	break;
4395	case tok::l_paren:
4396	parseParens();
4397	break;
4398	default:
4399	parseVerilogHierarchyIdentifier();
4400	break;
4401	}
4402	}
4403
4404	unsigned UnwrappedLineParser::parseVerilogHierarchyHeader() {
4405	unsigned AddLevels = `0`;
4406
4407	if (FormatTok->is(II: Keywords.kw_clocking)) {
4408	nextToken();
4409	if (Keywords.isVerilogIdentifier(Tok: *FormatTok))
4410	nextToken();
4411	parseVerilogSensitivityList();
4412	if (FormatTok->is(Kind: tok::semi))
4413	nextToken();
4414	} else if (FormatTok->isOneOf(K1: tok::kw_case, K2: Keywords.kw_casex,
4415	Ks: Keywords.kw_casez, Ks: Keywords.kw_randcase,
4416	Ks: Keywords.kw_randsequence)) {
4417	if (Style.IndentCaseLabels)
4418	AddLevels++;
4419	nextToken();
4420	if (FormatTok->is(Kind: tok::l_paren)) {
4421	FormatTok->setFinalizedType(TT_ConditionLParen);
4422	parseParens();
4423	}
4424	if (FormatTok->isOneOf(K1: Keywords.kw_inside, K2: Keywords.kw_matches))
4425	nextToken();
4426	// The case header has no semicolon.
4427	} else {
4428	// "module" etc.
4429	nextToken();
4430	// all the words like the name of the module and specifiers like
4431	// "automatic" and the width of function return type
4432	while (true) {
4433	if (FormatTok->is(Kind: tok::l_square)) {
4434	auto Prev = FormatTok->getPreviousNonComment();
4435	if (Prev && Keywords.isVerilogIdentifier(Tok: *Prev))
4436	Prev->setFinalizedType(TT_VerilogDimensionedTypeName);
4437	parseSquare();
4438	} else if (Keywords.isVerilogIdentifier(Tok: *FormatTok) \|\|
4439	FormatTok->isOneOf(K1: tok::hash, K2: tok::hashhash, Ks: tok::coloncolon,
4440	Ks: Keywords.kw_automatic, Ks: tok::kw_static)) {
4441	nextToken();
4442	} else {
4443	break;
4444	}
4445	}
4446
4447	auto NewLine = [this]() {
4448	addUnwrappedLine();
4449	Line ->IsContinuation = true;
4450	};
4451
4452	// package imports
4453	while (FormatTok->is(II: Keywords.kw_import)) {
4454	NewLine ();
4455	nextToken();
4456	parseVerilogHierarchyIdentifier();
4457	if (FormatTok->is(Kind: tok::semi))
4458	nextToken();
4459	}
4460
4461	// parameters and ports
4462	if (FormatTok->is(II: Keywords.kw_verilogHash)) {
4463	NewLine ();
4464	nextToken();
4465	if (FormatTok->is(Kind: tok::l_paren)) {
4466	FormatTok->setFinalizedType(TT_VerilogMultiLineListLParen);
4467	parseParens();
4468	}
4469	}
4470	if (FormatTok->is(Kind: tok::l_paren)) {
4471	NewLine ();
4472	FormatTok->setFinalizedType(TT_VerilogMultiLineListLParen);
4473	parseParens();
4474	}
4475
4476	// extends and implements
4477	if (FormatTok->is(II: Keywords.kw_extends)) {
4478	NewLine ();
4479	nextToken();
4480	parseVerilogHierarchyIdentifier();
4481	if (FormatTok->is(Kind: tok::l_paren))
4482	parseParens();
4483	}
4484	if (FormatTok->is(II: Keywords.kw_implements)) {
4485	NewLine ();
4486	do {
4487	nextToken();
4488	parseVerilogHierarchyIdentifier();
4489	} while (FormatTok->is(Kind: tok::comma));
4490	}
4491
4492	// Coverage event for cover groups.
4493	if (FormatTok->is(Kind: tok::at)) {
4494	NewLine ();
4495	parseVerilogSensitivityList();
4496	}
4497
4498	if (FormatTok->is(Kind: tok::semi))
4499	nextToken(/LevelDifference=/`1`);
4500	addUnwrappedLine();
4501	}
4502
4503	return AddLevels;
4504	}
4505
4506	void UnwrappedLineParser::parseVerilogTable() {
4507	assert(FormatTok->is(Keywords.kw_table));
4508	nextToken(/LevelDifference=/`1`);
4509	addUnwrappedLine();
4510
4511	auto InitialLevel = Line ->Level++;
4512	while (!eof() && !Keywords.isVerilogEnd(Tok: *FormatTok)) {
4513	FormatToken *Tok = FormatTok;
4514	nextToken();
4515	if (Tok->is(Kind: tok::semi))
4516	addUnwrappedLine();
4517	else if (Tok->isOneOf(K1: tok::star, K2: tok::colon, Ks: tok::question, Ks: tok::minus))
4518	Tok->setFinalizedType(TT_VerilogTableItem);
4519	}
4520	Line ->Level = InitialLevel;
4521	nextToken(/LevelDifference=/-`1`);
4522	addUnwrappedLine();
4523	}
4524
4525	void UnwrappedLineParser::parseVerilogCaseLabel() {
4526	// The label will get unindented in AnnotatingParser. If there are no leading
4527	// spaces, indent the rest here so that things inside the block will be
4528	// indented relative to things outside. We don't use parseLabel because we
4529	// don't know whether this colon is a label or a ternary expression at this
4530	// point.
4531	auto OrigLevel = Line ->Level;
4532	auto FirstLine = CurrentLines->size();
4533	if (Line ->Level == `0` \|\| (Line ->InPPDirective && Line ->Level <= `1`))
4534	++Line ->Level;
4535	else if (!Style.IndentCaseBlocks && Keywords.isVerilogBegin(Tok: *FormatTok))
4536	--Line ->Level;
4537	parseStructuralElement();
4538	// Restore the indentation in both the new line and the line that has the
4539	// label.
4540	if (CurrentLines->size() > FirstLine)
4541	(*CurrentLines)[FirstLine].Level = OrigLevel;
4542	Line ->Level = OrigLevel;
4543	}
4544
4545	bool UnwrappedLineParser::containsExpansion(const UnwrappedLine &Line) const {
4546	for (const auto &N : Line.Tokens) {
4547	if (N.Tok->MacroCtx)
4548	return true;
4549	for (const UnwrappedLine &Child : N.Children)
4550	if (containsExpansion(Line: Child))
4551	return true;
4552	}
4553	return false;
4554	}
4555
4556	void UnwrappedLineParser::addUnwrappedLine(LineLevel AdjustLevel) {
4557	if (Line ->Tokens.empty())
4558	return;
4559	LLVM_DEBUG({
4560	if (!parsingPPDirective()) {
4561	llvm::dbgs() << "Adding unwrapped line:\n";
4562	printDebugInfo(*Line);
4563	}
4564	});
4565
4566	// If this line closes a block when in Whitesmiths mode, remember that
4567	// information so that the level can be decreased after the line is added.
4568	// This has to happen after the addition of the line since the line itself
4569	// needs to be indented.
4570	bool ClosesWhitesmithsBlock =
4571	Line ->MatchingOpeningBlockLineIndex != UnwrappedLine::kInvalidIndex &&
4572	Style.BreakBeforeBraces == FormatStyle::BS_Whitesmiths;
4573
4574	// If the current line was expanded from a macro call, we use it to
4575	// reconstruct an unwrapped line from the structure of the expanded unwrapped
4576	// line and the unexpanded token stream.
4577	if (!parsingPPDirective() && !InExpansion && containsExpansion(Line: *Line)) {
4578	if (!Reconstruct)
4579	Reconstruct.emplace(args&: Line ->Level, args&: Unexpanded);
4580	Reconstruct ->addLine(Line: *Line);
4581
4582	// While the reconstructed unexpanded lines are stored in the normal
4583	// flow of lines, the expanded lines are stored on the side to be analyzed
4584	// in an extra step.
4585	CurrentExpandedLines.push_back(Elt: std::move(*Line));
4586
4587	if (Reconstruct ->finished()) {
4588	UnwrappedLine Reconstructed = std::move(*Reconstruct).takeResult();
4589	assert(!Reconstructed.Tokens.empty() &&
4590	"Reconstructed must at least contain the macro identifier.");
4591	assert(!parsingPPDirective());
4592	LLVM_DEBUG({
4593	llvm::dbgs() << "Adding unexpanded line:\n";
4594	printDebugInfo(Reconstructed);
4595	});
4596	ExpandedLines [Reconstructed.Tokens.begin()->Tok] = CurrentExpandedLines;
4597	Lines.push_back(Elt: std::move(Reconstructed));
4598	CurrentExpandedLines.clear();
4599	Reconstruct.reset();
4600	}
4601	} else {
4602	// At the top level we only get here when no unexpansion is going on, or
4603	// when conditional formatting led to unfinished macro reconstructions.
4604	assert(!Reconstruct \|\| (CurrentLines != &Lines) \|\| PPStack.size() > `0`);
4605	CurrentLines->push_back(Elt: std::move(*Line));
4606	}
4607	Line ->Tokens.clear();
4608	Line ->MatchingOpeningBlockLineIndex = UnwrappedLine::kInvalidIndex;
4609	Line ->FirstStartColumn = `0`;
4610	Line ->IsContinuation = false;
4611	Line ->SeenDecltypeAuto = false;
4612
4613	if (ClosesWhitesmithsBlock && AdjustLevel == LineLevel::Remove)
4614	--Line ->Level;
4615	if (!parsingPPDirective() && !PreprocessorDirectives.empty()) {
4616	CurrentLines->append(
4617	in_start: std::make_move_iterator(i: PreprocessorDirectives.begin()),
4618	in_end: std::make_move_iterator(i: PreprocessorDirectives.end()));
4619	PreprocessorDirectives.clear();
4620	}
4621	// Disconnect the current token from the last token on the previous line.
4622	FormatTok->Previous = nullptr;
4623	}
4624
4625	bool UnwrappedLineParser::eof() const { return FormatTok->is(Kind: tok::eof); }
4626
4627	bool UnwrappedLineParser::isOnNewLine(const FormatToken &FormatTok) {
4628	return (Line ->InPPDirective \|\| FormatTok.HasUnescapedNewline) &&
4629	FormatTok.NewlinesBefore > `0`;
4630	}
4631
4632	// Checks if \p FormatTok is a line comment that continues the line comment
4633	// section on \p Line.
4634	static bool
4635	continuesLineCommentSection(const FormatToken &FormatTok,
4636	const UnwrappedLine &Line, const FormatStyle &Style,
4637	const llvm::Regex &CommentPragmasRegex) {
4638	if (Line.Tokens.empty() \|\| Style.ReflowComments != FormatStyle::RCS_Always)
4639	return false;
4640
4641	StringRef IndentContent = FormatTok.TokenText;
4642	if (FormatTok.TokenText.starts_with(Prefix: "//") \|\|
4643	FormatTok.TokenText.starts_with(Prefix: "/*")) {
4644	IndentContent = FormatTok.TokenText.substr(Start: `2`);
4645	}
4646	if (CommentPragmasRegex.match(String: IndentContent))
4647	return false;
4648
4649	// If Line starts with a line comment, then FormatTok continues the comment
4650	// section if its original column is greater or equal to the original start
4651	// column of the line.
4652	//
4653	// Define the min column token of a line as follows: if a line ends in '{' or
4654	// contains a '{' followed by a line comment, then the min column token is
4655	// that '{'. Otherwise, the min column token of the line is the first token of
4656	// the line.
4657	//
4658	// If Line starts with a token other than a line comment, then FormatTok
4659	// continues the comment section if its original column is greater than the
4660	// original start column of the min column token of the line.
4661	//
4662	// For example, the second line comment continues the first in these cases:
4663	//
4664	// // first line
4665	// // second line
4666	//
4667	// and:
4668	//
4669	// // first line
4670	// // second line
4671	//
4672	// and:
4673	//
4674	// int i; // first line
4675	// // second line
4676	//
4677	// and:
4678	//
4679	// do { // first line
4680	// // second line
4681	// int i;
4682	// } while (true);
4683	//
4684	// and:
4685	//
4686	// enum {
4687	// a, // first line
4688	// // second line
4689	// b
4690	// };
4691	//
4692	// The second line comment doesn't continue the first in these cases:
4693	//
4694	// // first line
4695	// // second line
4696	//
4697	// and:
4698	//
4699	// int i; // first line
4700	// // second line
4701	//
4702	// and:
4703	//
4704	// do { // first line
4705	// // second line
4706	// int i;
4707	// } while (true);
4708	//
4709	// and:
4710	//
4711	// enum {
4712	// a, // first line
4713	// // second line
4714	// };
4715	const FormatToken *MinColumnToken = Line.Tokens.front().Tok;
4716
4717	// Scan for '{//'. If found, use the column of '{' as a min column for line
4718	// comment section continuation.
4719	const FormatToken PreviousToken = nullptr*;
4720	for (const UnwrappedLineNode &Node : Line.Tokens) {
4721	if (PreviousToken && PreviousToken->is(Kind: tok::l_brace) &&
4722	isLineComment(FormatTok: *Node.Tok)) {
4723	MinColumnToken = PreviousToken;
4724	break;
4725	}
4726	PreviousToken = Node.Tok;
4727
4728	// Grab the last newline preceding a token in this unwrapped line.
4729	if (Node.Tok->NewlinesBefore > `0`)
4730	MinColumnToken = Node.Tok;
4731	}
4732	if (PreviousToken && PreviousToken->is(Kind: tok::l_brace))
4733	MinColumnToken = PreviousToken;
4734
4735	return continuesLineComment(FormatTok, /Previous=/Line.Tokens.back().Tok,
4736	MinColumnToken);
4737	}
4738
4739	void UnwrappedLineParser::flushComments(bool NewlineBeforeNext) {
4740	bool JustComments = Line ->Tokens.empty();
4741	for (FormatToken *Tok : CommentsBeforeNextToken) {
4742	// Line comments that belong to the same line comment section are put on the
4743	// same line since later we might want to reflow content between them.
4744	// Additional fine-grained breaking of line comment sections is controlled
4745	// by the class BreakableLineCommentSection in case it is desirable to keep
4746	// several line comment sections in the same unwrapped line.
4747	//
4748	// FIXME: Consider putting separate line comment sections as children to the
4749	// unwrapped line instead.
4750	Tok->ContinuesLineCommentSection =
4751	continuesLineCommentSection(FormatTok: Tok, Line: Line, Style, CommentPragmasRegex);
4752	if (isOnNewLine(FormatTok: *Tok) && JustComments && !Tok->ContinuesLineCommentSection)
4753	addUnwrappedLine();
4754	pushToken(Tok);
4755	}
4756	if (NewlineBeforeNext && JustComments)
4757	addUnwrappedLine();
4758	CommentsBeforeNextToken.clear();
4759	}
4760
4761	void UnwrappedLineParser::nextToken(int LevelDifference) {
4762	if (eof())
4763	return;
4764	flushComments(NewlineBeforeNext: isOnNewLine(FormatTok: *FormatTok));
4765	pushToken(Tok: FormatTok);
4766	FormatToken *Previous = FormatTok;
4767	if (!Style.isJavaScript())
4768	readToken(LevelDifference);
4769	else
4770	readTokenWithJavaScriptASI();
4771	FormatTok->Previous = Previous;
4772	if (Style.isVerilog()) {
4773	// Blocks in Verilog can have `begin` and `end` instead of braces. For
4774	// keywords like `begin`, we can't treat them the same as left braces
4775	// because some contexts require one of them. For example structs use
4776	// braces and if blocks use keywords, and a left brace can occur in an if
4777	// statement, but it is not a block. For keywords like `end`, we simply
4778	// treat them the same as right braces.
4779	if (Keywords.isVerilogEnd(Tok: *FormatTok))
4780	FormatTok->Tok.setKind(tok::r_brace);
4781	}
4782	}
4783
4784	void UnwrappedLineParser::distributeComments(
4785	const ArrayRef<FormatToken > &Comments, const* FormatToken *NextTok) {
4786	// Whether or not a line comment token continues a line is controlled by
4787	// the method continuesLineCommentSection, with the following caveat:
4788	//
4789	// Define a trail of Comments to be a nonempty proper postfix of Comments such
4790	// that each comment line from the trail is aligned with the next token, if
4791	// the next token exists. If a trail exists, the beginning of the maximal
4792	// trail is marked as a start of a new comment section.
4793	//
4794	// For example in this code:
4795	//
4796	// int a; // line about a
4797	// // line 1 about b
4798	// // line 2 about b
4799	// int b;
4800	//
4801	// the two lines about b form a maximal trail, so there are two sections, the
4802	// first one consisting of the single comment "// line about a" and the
4803	// second one consisting of the next two comments.
4804	if (Comments.empty())
4805	return;
4806	bool ShouldPushCommentsInCurrentLine = true;
4807	bool HasTrailAlignedWithNextToken = false;
4808	unsigned StartOfTrailAlignedWithNextToken = `0`;
4809	if (NextTok) {
4810	// We are skipping the first element intentionally.
4811	for (unsigned i = Comments.size() - `1`; i > `0`; --i) {
4812	if (Comments [i]->OriginalColumn == NextTok->OriginalColumn) {
4813	HasTrailAlignedWithNextToken = true;
4814	StartOfTrailAlignedWithNextToken = i;
4815	}
4816	}
4817	}
4818	for (unsigned i = `0`, e = Comments.size(); i < e; ++i) {
4819	FormatToken *FormatTok = Comments [i];
4820	if (HasTrailAlignedWithNextToken && i == StartOfTrailAlignedWithNextToken) {
4821	FormatTok->ContinuesLineCommentSection = false;
4822	} else {
4823	FormatTok->ContinuesLineCommentSection = continuesLineCommentSection(
4824	FormatTok: FormatTok, Line: Line, Style, CommentPragmasRegex);
4825	}
4826	if (!FormatTok->ContinuesLineCommentSection &&
4827	(isOnNewLine(FormatTok: *FormatTok) \|\| FormatTok->IsFirst)) {
4828	ShouldPushCommentsInCurrentLine = false;
4829	}
4830	if (ShouldPushCommentsInCurrentLine)
4831	pushToken(Tok: FormatTok);
4832	else
4833	CommentsBeforeNextToken.push_back(Elt: FormatTok);
4834	}
4835	}
4836
4837	void UnwrappedLineParser::readToken(int LevelDifference) {
4838	SmallVector<FormatToken *, `1`> Comments;
4839	bool PreviousWasComment = false;
4840	bool FirstNonCommentOnLine = false;
4841	do {
4842	FormatTok = Tokens->getNextToken();
4843	assert(FormatTok);
4844	while (FormatTok->isOneOf(K1: TT_ConflictStart, K2: TT_ConflictEnd,
4845	Ks: TT_ConflictAlternative)) {
4846	if (FormatTok->is(TT: TT_ConflictStart))
4847	conditionalCompilationStart(/Unreachable=/false);
4848	else if (FormatTok->is(TT: TT_ConflictAlternative))
4849	conditionalCompilationAlternative();
4850	else if (FormatTok->is(TT: TT_ConflictEnd))
4851	conditionalCompilationEnd();
4852	FormatTok = Tokens->getNextToken();
4853	FormatTok->MustBreakBefore = true;
4854	FormatTok->MustBreakBeforeFinalized = true;
4855	}
4856
4857	auto IsFirstNonCommentOnLine = [](bool FirstNonCommentOnLine,
4858	const FormatToken &Tok,
4859	bool PreviousWasComment) {
4860	auto IsFirstOnLine = [](const FormatToken &Tok) {
4861	return Tok.HasUnescapedNewline \|\| Tok.IsFirst;
4862	};
4863
4864	// Consider preprocessor directives preceded by block comments as first
4865	// on line.
4866	if (PreviousWasComment)
4867	return FirstNonCommentOnLine \|\| IsFirstOnLine(Tok);
4868	return IsFirstOnLine(Tok);
4869	};
4870
4871	FirstNonCommentOnLine = IsFirstNonCommentOnLine (
4872	FirstNonCommentOnLine, *FormatTok, PreviousWasComment);
4873	PreviousWasComment = FormatTok->is(Kind: tok::comment);
4874
4875	while (!Line ->InPPDirective && FormatTok->is(Kind: tok::hash) &&
4876	FirstNonCommentOnLine) {
4877	// In Verilog, the backtick is used for macro invocations. In TableGen,
4878	// the single hash is used for the paste operator.
4879	const auto *Next = Tokens->peekNextToken();
4880	if ((Style.isVerilog() && !Keywords.isVerilogPPDirective(Tok: *Next)) \|\|
4881	(Style.isTableGen() &&
4882	!Next->isOneOf(K1: tok::kw_else, K2: tok::pp_define, Ks: tok::pp_ifdef,
4883	Ks: tok::pp_ifndef, Ks: tok::pp_endif))) {
4884	break;
4885	}
4886	distributeComments(Comments, NextTok: FormatTok);
4887	Comments.clear();
4888	// If there is an unfinished unwrapped line, we flush the preprocessor
4889	// directives only after that unwrapped line was finished later.
4890	bool SwitchToPreprocessorLines = !Line ->Tokens.empty();
4891	ScopedLineState BlockState(*this, SwitchToPreprocessorLines);
4892	assert((LevelDifference >= `0` \|\|
4893	static_cast<unsigned>(-LevelDifference) <= Line->Level) &&
4894	"LevelDifference makes Line->Level negative");
4895	Line ->Level += LevelDifference;
4896	// Comments stored before the preprocessor directive need to be output
4897	// before the preprocessor directive, at the same level as the
4898	// preprocessor directive, as we consider them to apply to the directive.
4899	if (Style.IndentPPDirectives == FormatStyle::PPDIS_BeforeHash &&
4900	PPBranchLevel > `0`) {
4901	Line ->Level += PPBranchLevel;
4902	}
4903	assert(Line->Level >= Line->UnbracedBodyLevel);
4904	Line ->Level -= Line ->UnbracedBodyLevel;
4905	flushComments(NewlineBeforeNext: isOnNewLine(FormatTok: *FormatTok));
4906	parsePPDirective();
4907	PreviousWasComment = FormatTok->is(Kind: tok::comment);
4908	FirstNonCommentOnLine = IsFirstNonCommentOnLine (
4909	FirstNonCommentOnLine, *FormatTok, PreviousWasComment);
4910	}
4911
4912	if (!PPStack.empty() && (PPStack.back().Kind == PP_Unreachable) &&
4913	!Line ->InPPDirective) {
4914	continue;
4915	}
4916
4917	if (FormatTok->is(Kind: tok::identifier) &&
4918	Macros.defined(Name: FormatTok->TokenText) &&
4919	// FIXME: Allow expanding macros in preprocessor directives.
4920	!Line ->InPPDirective) {
4921	FormatToken *ID = FormatTok;
4922	unsigned Position = Tokens->getPosition();
4923
4924	// To correctly parse the code, we need to replace the tokens of the macro
4925	// call with its expansion.
4926	auto PreCall = std::move(Line);
4927	Line.reset(p: new UnwrappedLine);
4928	bool OldInExpansion = InExpansion;
4929	InExpansion = true;
4930	// We parse the macro call into a new line.
4931	auto Args = parseMacroCall();
4932	InExpansion = OldInExpansion;
4933	assert(Line->Tokens.front().Tok == ID);
4934	// And remember the unexpanded macro call tokens.
4935	auto UnexpandedLine = std::move(Line);
4936	// Reset to the old line.
4937	Line = std::move(PreCall);
4938
4939	LLVM_DEBUG({
4940	llvm::dbgs() << "Macro call: " << ID->TokenText << "(";
4941	if (Args) {
4942	llvm::dbgs() << "(";
4943	for (const auto &Arg : Args.value())
4944	for (const auto &T : Arg)
4945	llvm::dbgs() << T->TokenText << " ";
4946	llvm::dbgs() << ")";
4947	}
4948	llvm::dbgs() << "\n";
4949	});
4950	if (Macros.objectLike(Name: ID->TokenText) && Args &&
4951	!Macros.hasArity(Name: ID->TokenText, Arity: Args ->size())) {
4952	// The macro is either
4953	// - object-like, but we got argumnets, or
4954	// - overloaded to be both object-like and function-like, but none of
4955	// the function-like arities match the number of arguments.
4956	// Thus, expand as object-like macro.
4957	LLVM_DEBUG(llvm::dbgs()
4958	<< "Macro \"" << ID->TokenText
4959	<< "\" not overloaded for arity " << Args->size()
4960	<< "or not function-like, using object-like overload.");
4961	Args.reset();
4962	UnexpandedLine ->Tokens.resize(new_size: `1`);
4963	Tokens->setPosition(Position);
4964	nextToken();
4965	assert(!Args && Macros.objectLike(ID->TokenText));
4966	}
4967	if ((!Args && Macros.objectLike(Name: ID->TokenText)) \|\|
4968	(Args && Macros.hasArity(Name: ID->TokenText, Arity: Args ->size()))) {
4969	// Next, we insert the expanded tokens in the token stream at the
4970	// current position, and continue parsing.
4971	Unexpanded [ID] = std::move(UnexpandedLine);
4972	SmallVector<FormatToken *, `8`> Expansion =
4973	Macros.expand(ID, OptionalArgs: std::move(Args));
4974	if (!Expansion.empty())
4975	FormatTok = Tokens->insertTokens(Tokens: Expansion);
4976
4977	LLVM_DEBUG({
4978	llvm::dbgs() << "Expanded: ";
4979	for (const auto &T : Expansion)
4980	llvm::dbgs() << T->TokenText << " ";
4981	llvm::dbgs() << "\n";
4982	});
4983	} else {
4984	LLVM_DEBUG({
4985	llvm::dbgs() << "Did not expand macro \"" << ID->TokenText
4986	<< "\", because it was used ";
4987	if (Args)
4988	llvm::dbgs() << "with " << Args->size();
4989	else
4990	llvm::dbgs() << "without";
4991	llvm::dbgs() << " arguments, which doesn't match any definition.\n";
4992	});
4993	Tokens->setPosition(Position);
4994	FormatTok = ID;
4995	}
4996	}
4997
4998	if (FormatTok->isNot(Kind: tok::comment)) {
4999	distributeComments(Comments, NextTok: FormatTok);
5000	Comments.clear();
5001	return;
5002	}
5003
5004	Comments.push_back(Elt: FormatTok);
5005	} while (!eof());
5006
5007	distributeComments(Comments, NextTok: nullptr);
5008	Comments.clear();
5009	}
5010
5011	namespace {
5012	template <typename Iterator>
5013	void pushTokens(Iterator Begin, Iterator End,
5014	SmallVectorImpl<FormatToken *> &Into) {
5015	for (auto I = Begin; I != End; ++I) {
5016	Into.push_back(Elt: I->Tok);
5017	for (const auto &Child : I->Children)
5018	pushTokens(Child.Tokens.begin(), Child.Tokens.end(), Into);
5019	}
5020	}
5021	} // namespace
5022
5023	std::optional<llvm::SmallVector<llvm::SmallVector<FormatToken *, `8`>, `1`>>
5024	UnwrappedLineParser::parseMacroCall() {
5025	std::optional<llvm::SmallVector<llvm::SmallVector<FormatToken *, `8`>, `1`>> Args;
5026	assert(Line->Tokens.empty());
5027	nextToken();
5028	if (FormatTok->isNot(Kind: tok::l_paren))
5029	return Args;
5030	unsigned Position = Tokens->getPosition();
5031	FormatToken *Tok = FormatTok;
5032	nextToken();
5033	Args.emplace();
5034	auto ArgStart = std::prev(x: Line ->Tokens.end());
5035
5036	int Parens = `0`;
5037	do {
5038	switch (FormatTok->Tok.getKind()) {
5039	case tok::l_paren:
5040	++Parens;
5041	nextToken();
5042	break;
5043	case tok::r_paren: {
5044	if (Parens > `0`) {
5045	--Parens;
5046	nextToken();
5047	break;
5048	}
5049	Args ->push_back(Elt: {});
5050	pushTokens(Begin: std::next(x: ArgStart), End: Line ->Tokens.end(), Into&: Args ->back());
5051	nextToken();
5052	return Args;
5053	}
5054	case tok::comma: {
5055	if (Parens > `0`) {
5056	nextToken();
5057	break;
5058	}
5059	Args ->push_back(Elt: {});
5060	pushTokens(Begin: std::next(x: ArgStart), End: Line ->Tokens.end(), Into&: Args ->back());
5061	nextToken();
5062	ArgStart = std::prev(x: Line ->Tokens.end());
5063	break;
5064	}
5065	default:
5066	nextToken();
5067	break;
5068	}
5069	} while (!eof());
5070	Line ->Tokens.resize(new_size: `1`);
5071	Tokens->setPosition(Position);
5072	FormatTok = Tok;
5073	return {};
5074	}
5075
5076	void UnwrappedLineParser::pushToken(FormatToken *Tok) {
5077	Line ->Tokens.push_back(x: UnwrappedLineNode (Tok));
5078	if (AtEndOfPPLine) {
5079	auto &Tok = *Line ->Tokens.back().Tok;
5080	Tok.MustBreakBefore = true;
5081	Tok.MustBreakBeforeFinalized = true;
5082	Tok.FirstAfterPPLine = true;
5083	AtEndOfPPLine = false;
5084	}
5085	}
5086
5087	} // end namespace format
5088	} // end namespace clang
5089

Browse the source code of llvm_projects/clang/lib/Format/UnwrappedLineParser.cpp