1 | //===- ThreadSafetyCommon.h -------------------------------------*- C++ -*-===// |
2 | // |
3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
4 | // See https://llvm.org/LICENSE.txt for license information. |
5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
6 | // |
7 | //===----------------------------------------------------------------------===// |
8 | // |
9 | // Parts of thread safety analysis that are not specific to thread safety |
10 | // itself have been factored into classes here, where they can be potentially |
11 | // used by other analyses. Currently these include: |
12 | // |
13 | // * Generalize clang CFG visitors. |
14 | // * Conversion of the clang CFG to SSA form. |
15 | // * Translation of clang Exprs to TIL SExprs |
16 | // |
17 | // UNDER CONSTRUCTION. USE AT YOUR OWN RISK. |
18 | // |
19 | //===----------------------------------------------------------------------===// |
20 | |
21 | #ifndef LLVM_CLANG_ANALYSIS_ANALYSES_THREADSAFETYCOMMON_H |
22 | #define LLVM_CLANG_ANALYSIS_ANALYSES_THREADSAFETYCOMMON_H |
23 | |
24 | #include "clang/AST/Decl.h" |
25 | #include "clang/Analysis/Analyses/PostOrderCFGView.h" |
26 | #include "clang/Analysis/Analyses/ThreadSafetyTIL.h" |
27 | #include "clang/Analysis/Analyses/ThreadSafetyTraverse.h" |
28 | #include "clang/Analysis/Analyses/ThreadSafetyUtil.h" |
29 | #include "clang/Analysis/AnalysisDeclContext.h" |
30 | #include "clang/Analysis/CFG.h" |
31 | #include "clang/Basic/LLVM.h" |
32 | #include "llvm/ADT/DenseMap.h" |
33 | #include "llvm/ADT/PointerIntPair.h" |
34 | #include "llvm/ADT/PointerUnion.h" |
35 | #include "llvm/ADT/SmallVector.h" |
36 | #include "llvm/Support/Casting.h" |
37 | #include <sstream> |
38 | #include <string> |
39 | #include <utility> |
40 | #include <vector> |
41 | |
42 | namespace clang { |
43 | |
44 | class AbstractConditionalOperator; |
45 | class ArraySubscriptExpr; |
46 | class BinaryOperator; |
47 | class CallExpr; |
48 | class CastExpr; |
49 | class CXXDestructorDecl; |
50 | class CXXMemberCallExpr; |
51 | class CXXOperatorCallExpr; |
52 | class CXXThisExpr; |
53 | class DeclRefExpr; |
54 | class DeclStmt; |
55 | class Expr; |
56 | class MemberExpr; |
57 | class Stmt; |
58 | class UnaryOperator; |
59 | |
60 | namespace threadSafety { |
61 | |
62 | // Various helper functions on til::SExpr |
63 | namespace sx { |
64 | |
65 | inline bool equals(const til::SExpr *E1, const til::SExpr *E2) { |
66 | return til::EqualsComparator::compareExprs(E1, E2); |
67 | } |
68 | |
69 | inline bool matches(const til::SExpr *E1, const til::SExpr *E2) { |
70 | // We treat a top-level wildcard as the "univsersal" lock. |
71 | // It matches everything for the purpose of checking locks, but not |
72 | // for unlocking them. |
73 | if (isa<til::Wildcard>(Val: E1)) |
74 | return isa<til::Wildcard>(Val: E2); |
75 | if (isa<til::Wildcard>(Val: E2)) |
76 | return isa<til::Wildcard>(Val: E1); |
77 | |
78 | return til::MatchComparator::compareExprs(E1, E2); |
79 | } |
80 | |
81 | inline bool partiallyMatches(const til::SExpr *E1, const til::SExpr *E2) { |
82 | const auto *PE1 = dyn_cast_or_null<til::Project>(Val: E1); |
83 | if (!PE1) |
84 | return false; |
85 | const auto *PE2 = dyn_cast_or_null<til::Project>(Val: E2); |
86 | if (!PE2) |
87 | return false; |
88 | return PE1->clangDecl() == PE2->clangDecl(); |
89 | } |
90 | |
91 | inline std::string toString(const til::SExpr *E) { |
92 | std::stringstream ss; |
93 | til::StdPrinter::print(E, SS&: ss); |
94 | return ss.str(); |
95 | } |
96 | |
97 | } // namespace sx |
98 | |
99 | // This class defines the interface of a clang CFG Visitor. |
100 | // CFGWalker will invoke the following methods. |
101 | // Note that methods are not virtual; the visitor is templatized. |
102 | class CFGVisitor { |
103 | // Enter the CFG for Decl D, and perform any initial setup operations. |
104 | void enterCFG(CFG *Cfg, const NamedDecl *D, const CFGBlock *First) {} |
105 | |
106 | // Enter a CFGBlock. |
107 | void enterCFGBlock(const CFGBlock *B) {} |
108 | |
109 | // Returns true if this visitor implements handlePredecessor |
110 | bool visitPredecessors() { return true; } |
111 | |
112 | // Process a predecessor edge. |
113 | void handlePredecessor(const CFGBlock *Pred) {} |
114 | |
115 | // Process a successor back edge to a previously visited block. |
116 | void handlePredecessorBackEdge(const CFGBlock *Pred) {} |
117 | |
118 | // Called just before processing statements. |
119 | void enterCFGBlockBody(const CFGBlock *B) {} |
120 | |
121 | // Process an ordinary statement. |
122 | void handleStatement(const Stmt *S) {} |
123 | |
124 | // Process a destructor call |
125 | void handleDestructorCall(const VarDecl *VD, const CXXDestructorDecl *DD) {} |
126 | |
127 | // Called after all statements have been handled. |
128 | void exitCFGBlockBody(const CFGBlock *B) {} |
129 | |
130 | // Return true |
131 | bool visitSuccessors() { return true; } |
132 | |
133 | // Process a successor edge. |
134 | void handleSuccessor(const CFGBlock *Succ) {} |
135 | |
136 | // Process a successor back edge to a previously visited block. |
137 | void handleSuccessorBackEdge(const CFGBlock *Succ) {} |
138 | |
139 | // Leave a CFGBlock. |
140 | void exitCFGBlock(const CFGBlock *B) {} |
141 | |
142 | // Leave the CFG, and perform any final cleanup operations. |
143 | void exitCFG(const CFGBlock *Last) {} |
144 | }; |
145 | |
146 | // Walks the clang CFG, and invokes methods on a given CFGVisitor. |
147 | class CFGWalker { |
148 | public: |
149 | CFGWalker() = default; |
150 | |
151 | // Initialize the CFGWalker. This setup only needs to be done once, even |
152 | // if there are multiple passes over the CFG. |
153 | bool init(AnalysisDeclContext &AC) { |
154 | ACtx = &AC; |
155 | CFGraph = AC.getCFG(); |
156 | if (!CFGraph) |
157 | return false; |
158 | |
159 | // Ignore anonymous functions. |
160 | if (!isa_and_nonnull<NamedDecl>(Val: AC.getDecl())) |
161 | return false; |
162 | |
163 | SortedGraph = AC.getAnalysis<PostOrderCFGView>(); |
164 | if (!SortedGraph) |
165 | return false; |
166 | |
167 | return true; |
168 | } |
169 | |
170 | // Traverse the CFG, calling methods on V as appropriate. |
171 | template <class Visitor> |
172 | void walk(Visitor &V) { |
173 | PostOrderCFGView::CFGBlockSet VisitedBlocks(CFGraph); |
174 | |
175 | V.enterCFG(CFGraph, getDecl(), &CFGraph->getEntry()); |
176 | |
177 | for (const auto *CurrBlock : *SortedGraph) { |
178 | VisitedBlocks.insert(Block: CurrBlock); |
179 | |
180 | V.enterCFGBlock(CurrBlock); |
181 | |
182 | // Process predecessors, handling back edges last |
183 | if (V.visitPredecessors()) { |
184 | SmallVector<CFGBlock*, 4> BackEdges; |
185 | // Process successors |
186 | for (CFGBlock::const_pred_iterator SI = CurrBlock->pred_begin(), |
187 | SE = CurrBlock->pred_end(); |
188 | SI != SE; ++SI) { |
189 | if (*SI == nullptr) |
190 | continue; |
191 | |
192 | if (!VisitedBlocks.alreadySet(Block: *SI)) { |
193 | BackEdges.push_back(Elt: *SI); |
194 | continue; |
195 | } |
196 | V.handlePredecessor(*SI); |
197 | } |
198 | |
199 | for (auto *Blk : BackEdges) |
200 | V.handlePredecessorBackEdge(Blk); |
201 | } |
202 | |
203 | V.enterCFGBlockBody(CurrBlock); |
204 | |
205 | // Process statements |
206 | for (const auto &BI : *CurrBlock) { |
207 | switch (BI.getKind()) { |
208 | case CFGElement::Statement: |
209 | V.handleStatement(BI.castAs<CFGStmt>().getStmt()); |
210 | break; |
211 | |
212 | case CFGElement::AutomaticObjectDtor: { |
213 | CFGAutomaticObjDtor AD = BI.castAs<CFGAutomaticObjDtor>(); |
214 | auto *DD = const_cast<CXXDestructorDecl *>( |
215 | AD.getDestructorDecl(astContext&: ACtx->getASTContext())); |
216 | auto *VD = const_cast<VarDecl *>(AD.getVarDecl()); |
217 | V.handleDestructorCall(VD, DD); |
218 | break; |
219 | } |
220 | default: |
221 | break; |
222 | } |
223 | } |
224 | |
225 | V.exitCFGBlockBody(CurrBlock); |
226 | |
227 | // Process successors, handling back edges first. |
228 | if (V.visitSuccessors()) { |
229 | SmallVector<CFGBlock*, 8> ForwardEdges; |
230 | |
231 | // Process successors |
232 | for (CFGBlock::const_succ_iterator SI = CurrBlock->succ_begin(), |
233 | SE = CurrBlock->succ_end(); |
234 | SI != SE; ++SI) { |
235 | if (*SI == nullptr) |
236 | continue; |
237 | |
238 | if (!VisitedBlocks.alreadySet(Block: *SI)) { |
239 | ForwardEdges.push_back(Elt: *SI); |
240 | continue; |
241 | } |
242 | V.handleSuccessorBackEdge(*SI); |
243 | } |
244 | |
245 | for (auto *Blk : ForwardEdges) |
246 | V.handleSuccessor(Blk); |
247 | } |
248 | |
249 | V.exitCFGBlock(CurrBlock); |
250 | } |
251 | V.exitCFG(&CFGraph->getExit()); |
252 | } |
253 | |
254 | const CFG *getGraph() const { return CFGraph; } |
255 | CFG *getGraph() { return CFGraph; } |
256 | |
257 | const NamedDecl *getDecl() const { |
258 | return dyn_cast<NamedDecl>(Val: ACtx->getDecl()); |
259 | } |
260 | |
261 | const PostOrderCFGView *getSortedGraph() const { return SortedGraph; } |
262 | |
263 | private: |
264 | CFG *CFGraph = nullptr; |
265 | AnalysisDeclContext *ACtx = nullptr; |
266 | PostOrderCFGView *SortedGraph = nullptr; |
267 | }; |
268 | |
269 | // TODO: move this back into ThreadSafety.cpp |
270 | // This is specific to thread safety. It is here because |
271 | // translateAttrExpr needs it, but that should be moved too. |
272 | class CapabilityExpr { |
273 | private: |
274 | /// The capability expression and whether it's negated. |
275 | llvm::PointerIntPair<const til::SExpr *, 1, bool> CapExpr; |
276 | |
277 | /// The kind of capability as specified by @ref CapabilityAttr::getName. |
278 | StringRef CapKind; |
279 | |
280 | public: |
281 | CapabilityExpr() : CapExpr(nullptr, false) {} |
282 | CapabilityExpr(const til::SExpr *E, StringRef Kind, bool Neg) |
283 | : CapExpr(E, Neg), CapKind(Kind) {} |
284 | |
285 | // Don't allow implicitly-constructed StringRefs since we'll capture them. |
286 | template <typename T> CapabilityExpr(const til::SExpr *, T, bool) = delete; |
287 | |
288 | const til::SExpr *sexpr() const { return CapExpr.getPointer(); } |
289 | StringRef getKind() const { return CapKind; } |
290 | bool negative() const { return CapExpr.getInt(); } |
291 | |
292 | CapabilityExpr operator!() const { |
293 | return CapabilityExpr(CapExpr.getPointer(), CapKind, !CapExpr.getInt()); |
294 | } |
295 | |
296 | bool equals(const CapabilityExpr &other) const { |
297 | return (negative() == other.negative()) && |
298 | sx::equals(E1: sexpr(), E2: other.sexpr()); |
299 | } |
300 | |
301 | bool matches(const CapabilityExpr &other) const { |
302 | return (negative() == other.negative()) && |
303 | sx::matches(E1: sexpr(), E2: other.sexpr()); |
304 | } |
305 | |
306 | bool matchesUniv(const CapabilityExpr &CapE) const { |
307 | return isUniversal() || matches(other: CapE); |
308 | } |
309 | |
310 | bool partiallyMatches(const CapabilityExpr &other) const { |
311 | return (negative() == other.negative()) && |
312 | sx::partiallyMatches(E1: sexpr(), E2: other.sexpr()); |
313 | } |
314 | |
315 | const ValueDecl* valueDecl() const { |
316 | if (negative() || sexpr() == nullptr) |
317 | return nullptr; |
318 | if (const auto *P = dyn_cast<til::Project>(Val: sexpr())) |
319 | return P->clangDecl(); |
320 | if (const auto *P = dyn_cast<til::LiteralPtr>(Val: sexpr())) |
321 | return P->clangDecl(); |
322 | return nullptr; |
323 | } |
324 | |
325 | std::string toString() const { |
326 | if (negative()) |
327 | return "!" + sx::toString(E: sexpr()); |
328 | return sx::toString(E: sexpr()); |
329 | } |
330 | |
331 | bool shouldIgnore() const { return sexpr() == nullptr; } |
332 | |
333 | bool isInvalid() const { return isa_and_nonnull<til::Undefined>(Val: sexpr()); } |
334 | |
335 | bool isUniversal() const { return isa_and_nonnull<til::Wildcard>(Val: sexpr()); } |
336 | }; |
337 | |
338 | // Translate clang::Expr to til::SExpr. |
339 | class SExprBuilder { |
340 | public: |
341 | /// Encapsulates the lexical context of a function call. The lexical |
342 | /// context includes the arguments to the call, including the implicit object |
343 | /// argument. When an attribute containing a mutex expression is attached to |
344 | /// a method, the expression may refer to formal parameters of the method. |
345 | /// Actual arguments must be substituted for formal parameters to derive |
346 | /// the appropriate mutex expression in the lexical context where the function |
347 | /// is called. PrevCtx holds the context in which the arguments themselves |
348 | /// should be evaluated; multiple calling contexts can be chained together |
349 | /// by the lock_returned attribute. |
350 | struct CallingContext { |
351 | // The previous context; or 0 if none. |
352 | CallingContext *Prev; |
353 | |
354 | // The decl to which the attr is attached. |
355 | const NamedDecl *AttrDecl; |
356 | |
357 | // Implicit object argument -- e.g. 'this' |
358 | llvm::PointerUnion<const Expr *, til::SExpr *> SelfArg = nullptr; |
359 | |
360 | // Number of funArgs |
361 | unsigned NumArgs = 0; |
362 | |
363 | // Function arguments |
364 | llvm::PointerUnion<const Expr *const *, til::SExpr *> FunArgs = nullptr; |
365 | |
366 | // is Self referred to with -> or .? |
367 | bool SelfArrow = false; |
368 | |
369 | CallingContext(CallingContext *P, const NamedDecl *D = nullptr) |
370 | : Prev(P), AttrDecl(D) {} |
371 | }; |
372 | |
373 | SExprBuilder(til::MemRegionRef A) : Arena(A) { |
374 | // FIXME: we don't always have a self-variable. |
375 | SelfVar = new (Arena) til::Variable(nullptr); |
376 | SelfVar->setKind(til::Variable::VK_SFun); |
377 | } |
378 | |
379 | // Translate a clang expression in an attribute to a til::SExpr. |
380 | // Constructs the context from D, DeclExp, and SelfDecl. |
381 | CapabilityExpr translateAttrExpr(const Expr *AttrExp, const NamedDecl *D, |
382 | const Expr *DeclExp, |
383 | til::SExpr *Self = nullptr); |
384 | |
385 | CapabilityExpr translateAttrExpr(const Expr *AttrExp, CallingContext *Ctx); |
386 | |
387 | // Translate a variable reference. |
388 | til::LiteralPtr *createVariable(const VarDecl *VD); |
389 | |
390 | // Create placeholder for this: we don't know the VarDecl on construction yet. |
391 | std::pair<til::LiteralPtr *, StringRef> |
392 | createThisPlaceholder(const Expr *Exp); |
393 | |
394 | // Translate a clang statement or expression to a TIL expression. |
395 | // Also performs substitution of variables; Ctx provides the context. |
396 | // Dispatches on the type of S. |
397 | til::SExpr *translate(const Stmt *S, CallingContext *Ctx); |
398 | til::SCFG *buildCFG(CFGWalker &Walker); |
399 | |
400 | til::SExpr *lookupStmt(const Stmt *S); |
401 | |
402 | til::BasicBlock *lookupBlock(const CFGBlock *B) { |
403 | return BlockMap[B->getBlockID()]; |
404 | } |
405 | |
406 | const til::SCFG *getCFG() const { return Scfg; } |
407 | til::SCFG *getCFG() { return Scfg; } |
408 | |
409 | private: |
410 | // We implement the CFGVisitor API |
411 | friend class CFGWalker; |
412 | |
413 | til::SExpr *translateDeclRefExpr(const DeclRefExpr *DRE, |
414 | CallingContext *Ctx) ; |
415 | til::SExpr *translateCXXThisExpr(const CXXThisExpr *TE, CallingContext *Ctx); |
416 | til::SExpr *translateMemberExpr(const MemberExpr *ME, CallingContext *Ctx); |
417 | til::SExpr *translateObjCIVarRefExpr(const ObjCIvarRefExpr *IVRE, |
418 | CallingContext *Ctx); |
419 | til::SExpr *translateCallExpr(const CallExpr *CE, CallingContext *Ctx, |
420 | const Expr *SelfE = nullptr); |
421 | til::SExpr *translateCXXMemberCallExpr(const CXXMemberCallExpr *ME, |
422 | CallingContext *Ctx); |
423 | til::SExpr *translateCXXOperatorCallExpr(const CXXOperatorCallExpr *OCE, |
424 | CallingContext *Ctx); |
425 | til::SExpr *translateUnaryOperator(const UnaryOperator *UO, |
426 | CallingContext *Ctx); |
427 | til::SExpr *translateBinOp(til::TIL_BinaryOpcode Op, |
428 | const BinaryOperator *BO, |
429 | CallingContext *Ctx, bool Reverse = false); |
430 | til::SExpr *translateBinAssign(til::TIL_BinaryOpcode Op, |
431 | const BinaryOperator *BO, |
432 | CallingContext *Ctx, bool Assign = false); |
433 | til::SExpr *translateBinaryOperator(const BinaryOperator *BO, |
434 | CallingContext *Ctx); |
435 | til::SExpr *translateCastExpr(const CastExpr *CE, CallingContext *Ctx); |
436 | til::SExpr *translateArraySubscriptExpr(const ArraySubscriptExpr *E, |
437 | CallingContext *Ctx); |
438 | til::SExpr *translateAbstractConditionalOperator( |
439 | const AbstractConditionalOperator *C, CallingContext *Ctx); |
440 | |
441 | til::SExpr *translateDeclStmt(const DeclStmt *S, CallingContext *Ctx); |
442 | |
443 | // Map from statements in the clang CFG to SExprs in the til::SCFG. |
444 | using StatementMap = llvm::DenseMap<const Stmt *, til::SExpr *>; |
445 | |
446 | // Map from clang local variables to indices in a LVarDefinitionMap. |
447 | using LVarIndexMap = llvm::DenseMap<const ValueDecl *, unsigned>; |
448 | |
449 | // Map from local variable indices to SSA variables (or constants). |
450 | using NameVarPair = std::pair<const ValueDecl *, til::SExpr *>; |
451 | using LVarDefinitionMap = CopyOnWriteVector<NameVarPair>; |
452 | |
453 | struct BlockInfo { |
454 | LVarDefinitionMap ExitMap; |
455 | bool HasBackEdges = false; |
456 | |
457 | // Successors yet to be processed |
458 | unsigned UnprocessedSuccessors = 0; |
459 | |
460 | // Predecessors already processed |
461 | unsigned ProcessedPredecessors = 0; |
462 | |
463 | BlockInfo() = default; |
464 | BlockInfo(BlockInfo &&) = default; |
465 | BlockInfo &operator=(BlockInfo &&) = default; |
466 | }; |
467 | |
468 | void enterCFG(CFG *Cfg, const NamedDecl *D, const CFGBlock *First); |
469 | void enterCFGBlock(const CFGBlock *B); |
470 | bool visitPredecessors() { return true; } |
471 | void handlePredecessor(const CFGBlock *Pred); |
472 | void handlePredecessorBackEdge(const CFGBlock *Pred); |
473 | void enterCFGBlockBody(const CFGBlock *B); |
474 | void handleStatement(const Stmt *S); |
475 | void handleDestructorCall(const VarDecl *VD, const CXXDestructorDecl *DD); |
476 | void exitCFGBlockBody(const CFGBlock *B); |
477 | bool visitSuccessors() { return true; } |
478 | void handleSuccessor(const CFGBlock *Succ); |
479 | void handleSuccessorBackEdge(const CFGBlock *Succ); |
480 | void exitCFGBlock(const CFGBlock *B); |
481 | void exitCFG(const CFGBlock *Last); |
482 | |
483 | void insertStmt(const Stmt *S, til::SExpr *E) { |
484 | SMap.insert(KV: std::make_pair(x&: S, y&: E)); |
485 | } |
486 | |
487 | til::SExpr *addStatement(til::SExpr *E, const Stmt *S, |
488 | const ValueDecl *VD = nullptr); |
489 | til::SExpr *lookupVarDecl(const ValueDecl *VD); |
490 | til::SExpr *addVarDecl(const ValueDecl *VD, til::SExpr *E); |
491 | til::SExpr *updateVarDecl(const ValueDecl *VD, til::SExpr *E); |
492 | |
493 | void makePhiNodeVar(unsigned i, unsigned NPreds, til::SExpr *E); |
494 | void mergeEntryMap(LVarDefinitionMap Map); |
495 | void mergeEntryMapBackEdge(); |
496 | void mergePhiNodesBackEdge(const CFGBlock *Blk); |
497 | |
498 | private: |
499 | // Set to true when parsing capability expressions, which get translated |
500 | // inaccurately in order to hack around smart pointers etc. |
501 | static const bool CapabilityExprMode = true; |
502 | |
503 | til::MemRegionRef Arena; |
504 | |
505 | // Variable to use for 'this'. May be null. |
506 | til::Variable *SelfVar = nullptr; |
507 | |
508 | til::SCFG *Scfg = nullptr; |
509 | |
510 | // Map from Stmt to TIL Variables |
511 | StatementMap SMap; |
512 | |
513 | // Indices of clang local vars. |
514 | LVarIndexMap LVarIdxMap; |
515 | |
516 | // Map from clang to til BBs. |
517 | std::vector<til::BasicBlock *> BlockMap; |
518 | |
519 | // Extra information per BB. Indexed by clang BlockID. |
520 | std::vector<BlockInfo> BBInfo; |
521 | |
522 | LVarDefinitionMap CurrentLVarMap; |
523 | std::vector<til::Phi *> CurrentArguments; |
524 | std::vector<til::SExpr *> CurrentInstructions; |
525 | std::vector<til::Phi *> IncompleteArgs; |
526 | til::BasicBlock *CurrentBB = nullptr; |
527 | BlockInfo *CurrentBlockInfo = nullptr; |
528 | }; |
529 | |
530 | #ifndef NDEBUG |
531 | // Dump an SCFG to llvm::errs(). |
532 | void printSCFG(CFGWalker &Walker); |
533 | #endif // NDEBUG |
534 | |
535 | } // namespace threadSafety |
536 | } // namespace clang |
537 | |
538 | #endif // LLVM_CLANG_ANALYSIS_ANALYSES_THREADSAFETYCOMMON_H |
539 | |