1 | //===--- CloneChecker.cpp - Clone detection checker -------------*- C++ -*-===// |
2 | // |
3 | // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. |
4 | // See https://llvm.org/LICENSE.txt for license information. |
5 | // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception |
6 | // |
7 | //===----------------------------------------------------------------------===// |
8 | /// |
9 | /// \file |
10 | /// CloneChecker is a checker that reports clones in the current translation |
11 | /// unit. |
12 | /// |
13 | //===----------------------------------------------------------------------===// |
14 | |
15 | #include "clang/StaticAnalyzer/Checkers/BuiltinCheckerRegistration.h" |
16 | #include "clang/Analysis/CloneDetection.h" |
17 | #include "clang/Basic/Diagnostic.h" |
18 | #include "clang/StaticAnalyzer/Core/BugReporter/BugType.h" |
19 | #include "clang/StaticAnalyzer/Core/Checker.h" |
20 | #include "clang/StaticAnalyzer/Core/CheckerManager.h" |
21 | #include "clang/StaticAnalyzer/Core/PathSensitive/AnalysisManager.h" |
22 | #include "clang/StaticAnalyzer/Core/PathSensitive/CheckerContext.h" |
23 | |
24 | using namespace clang; |
25 | using namespace ento; |
26 | |
27 | namespace { |
28 | class CloneChecker |
29 | : public Checker<check::ASTCodeBody, check::EndOfTranslationUnit> { |
30 | public: |
31 | // Checker options. |
32 | int MinComplexity; |
33 | bool ReportNormalClones = false; |
34 | StringRef IgnoredFilesPattern; |
35 | |
36 | private: |
37 | mutable CloneDetector Detector; |
38 | const BugType BT_Exact{this, "Exact code clone" , "Code clone" }; |
39 | const BugType BT_Suspicious{this, "Suspicious code clone" , "Code clone" }; |
40 | |
41 | public: |
42 | void checkASTCodeBody(const Decl *D, AnalysisManager &Mgr, |
43 | BugReporter &BR) const; |
44 | |
45 | void checkEndOfTranslationUnit(const TranslationUnitDecl *TU, |
46 | AnalysisManager &Mgr, BugReporter &BR) const; |
47 | |
48 | /// Reports all clones to the user. |
49 | void reportClones(BugReporter &BR, AnalysisManager &Mgr, |
50 | std::vector<CloneDetector::CloneGroup> &CloneGroups) const; |
51 | |
52 | /// Reports only suspicious clones to the user along with information |
53 | /// that explain why they are suspicious. |
54 | void reportSuspiciousClones( |
55 | BugReporter &BR, AnalysisManager &Mgr, |
56 | std::vector<CloneDetector::CloneGroup> &CloneGroups) const; |
57 | }; |
58 | } // end anonymous namespace |
59 | |
60 | void CloneChecker::checkASTCodeBody(const Decl *D, AnalysisManager &Mgr, |
61 | BugReporter &BR) const { |
62 | // Every statement that should be included in the search for clones needs to |
63 | // be passed to the CloneDetector. |
64 | Detector.analyzeCodeBody(D); |
65 | } |
66 | |
67 | void CloneChecker::checkEndOfTranslationUnit(const TranslationUnitDecl *TU, |
68 | AnalysisManager &Mgr, |
69 | BugReporter &BR) const { |
70 | // At this point, every statement in the translation unit has been analyzed by |
71 | // the CloneDetector. The only thing left to do is to report the found clones. |
72 | |
73 | // Let the CloneDetector create a list of clones from all the analyzed |
74 | // statements. We don't filter for matching variable patterns at this point |
75 | // because reportSuspiciousClones() wants to search them for errors. |
76 | std::vector<CloneDetector::CloneGroup> AllCloneGroups; |
77 | |
78 | Detector.findClones( |
79 | Result&: AllCloneGroups, ConstraintList: FilenamePatternConstraint(IgnoredFilesPattern), |
80 | ConstraintList: RecursiveCloneTypeIIHashConstraint(), ConstraintList: MinGroupSizeConstraint(2), |
81 | ConstraintList: MinComplexityConstraint(MinComplexity), |
82 | ConstraintList: RecursiveCloneTypeIIVerifyConstraint(), ConstraintList: OnlyLargestCloneConstraint()); |
83 | |
84 | reportSuspiciousClones(BR, Mgr, CloneGroups&: AllCloneGroups); |
85 | |
86 | // We are done for this translation unit unless we also need to report normal |
87 | // clones. |
88 | if (!ReportNormalClones) |
89 | return; |
90 | |
91 | // Now that the suspicious clone detector has checked for pattern errors, |
92 | // we also filter all clones who don't have matching patterns |
93 | CloneDetector::constrainClones(CloneGroups&: AllCloneGroups, |
94 | C: MatchingVariablePatternConstraint(), |
95 | ConstraintList: MinGroupSizeConstraint(2)); |
96 | |
97 | reportClones(BR, Mgr, CloneGroups&: AllCloneGroups); |
98 | } |
99 | |
100 | static PathDiagnosticLocation makeLocation(const StmtSequence &S, |
101 | AnalysisManager &Mgr) { |
102 | ASTContext &ACtx = Mgr.getASTContext(); |
103 | return PathDiagnosticLocation::createBegin( |
104 | S: S.front(), SM: ACtx.getSourceManager(), |
105 | LAC: Mgr.getAnalysisDeclContext(D: ACtx.getTranslationUnitDecl())); |
106 | } |
107 | |
108 | void CloneChecker::reportClones( |
109 | BugReporter &BR, AnalysisManager &Mgr, |
110 | std::vector<CloneDetector::CloneGroup> &CloneGroups) const { |
111 | for (const CloneDetector::CloneGroup &Group : CloneGroups) { |
112 | // We group the clones by printing the first as a warning and all others |
113 | // as a note. |
114 | auto R = std::make_unique<BasicBugReport>( |
115 | args: BT_Exact, args: "Duplicate code detected" , args: makeLocation(S: Group.front(), Mgr)); |
116 | R->addRange(R: Group.front().getSourceRange()); |
117 | |
118 | for (unsigned i = 1; i < Group.size(); ++i) |
119 | R->addNote(Msg: "Similar code here" , Pos: makeLocation(S: Group[i], Mgr), |
120 | Ranges: Group[i].getSourceRange()); |
121 | BR.emitReport(R: std::move(R)); |
122 | } |
123 | } |
124 | |
125 | void CloneChecker::reportSuspiciousClones( |
126 | BugReporter &BR, AnalysisManager &Mgr, |
127 | std::vector<CloneDetector::CloneGroup> &CloneGroups) const { |
128 | std::vector<VariablePattern::SuspiciousClonePair> Pairs; |
129 | |
130 | for (const CloneDetector::CloneGroup &Group : CloneGroups) { |
131 | for (unsigned i = 0; i < Group.size(); ++i) { |
132 | VariablePattern PatternA(Group[i]); |
133 | |
134 | for (unsigned j = i + 1; j < Group.size(); ++j) { |
135 | VariablePattern PatternB(Group[j]); |
136 | |
137 | VariablePattern::SuspiciousClonePair ClonePair; |
138 | // For now, we only report clones which break the variable pattern just |
139 | // once because multiple differences in a pattern are an indicator that |
140 | // those differences are maybe intended (e.g. because it's actually a |
141 | // different algorithm). |
142 | // FIXME: In very big clones even multiple variables can be unintended, |
143 | // so replacing this number with a percentage could better handle such |
144 | // cases. On the other hand it could increase the false-positive rate |
145 | // for all clones if the percentage is too high. |
146 | if (PatternA.countPatternDifferences(Other: PatternB, FirstMismatch: &ClonePair) == 1) { |
147 | Pairs.push_back(x: ClonePair); |
148 | break; |
149 | } |
150 | } |
151 | } |
152 | } |
153 | |
154 | ASTContext &ACtx = BR.getContext(); |
155 | SourceManager &SM = ACtx.getSourceManager(); |
156 | AnalysisDeclContext *ADC = |
157 | Mgr.getAnalysisDeclContext(D: ACtx.getTranslationUnitDecl()); |
158 | |
159 | for (VariablePattern::SuspiciousClonePair &Pair : Pairs) { |
160 | // FIXME: We are ignoring the suggestions currently, because they are |
161 | // only 50% accurate (even if the second suggestion is unavailable), |
162 | // which may confuse the user. |
163 | // Think how to perform more accurate suggestions? |
164 | |
165 | auto R = std::make_unique<BasicBugReport>( |
166 | args: BT_Suspicious, |
167 | args: "Potential copy-paste error; did you really mean to use '" + |
168 | Pair.FirstCloneInfo.Variable->getNameAsString() + "' here?" , |
169 | args: PathDiagnosticLocation::createBegin(S: Pair.FirstCloneInfo.Mention, SM, |
170 | LAC: ADC)); |
171 | R->addRange(R: Pair.FirstCloneInfo.Mention->getSourceRange()); |
172 | |
173 | R->addNote(Msg: "Similar code using '" + |
174 | Pair.SecondCloneInfo.Variable->getNameAsString() + "' here" , |
175 | Pos: PathDiagnosticLocation::createBegin(S: Pair.SecondCloneInfo.Mention, |
176 | SM, LAC: ADC), |
177 | Ranges: Pair.SecondCloneInfo.Mention->getSourceRange()); |
178 | |
179 | BR.emitReport(R: std::move(R)); |
180 | } |
181 | } |
182 | |
183 | //===----------------------------------------------------------------------===// |
184 | // Register CloneChecker |
185 | //===----------------------------------------------------------------------===// |
186 | |
187 | void ento::registerCloneChecker(CheckerManager &Mgr) { |
188 | auto *Checker = Mgr.registerChecker<CloneChecker>(); |
189 | |
190 | Checker->MinComplexity = Mgr.getAnalyzerOptions().getCheckerIntegerOption( |
191 | C: Checker, OptionName: "MinimumCloneComplexity" ); |
192 | |
193 | if (Checker->MinComplexity < 0) |
194 | Mgr.reportInvalidCheckerOptionValue( |
195 | C: Checker, OptionName: "MinimumCloneComplexity" , ExpectedValueDesc: "a non-negative value" ); |
196 | |
197 | Checker->ReportNormalClones = Mgr.getAnalyzerOptions().getCheckerBooleanOption( |
198 | C: Checker, OptionName: "ReportNormalClones" ); |
199 | |
200 | Checker->IgnoredFilesPattern = Mgr.getAnalyzerOptions() |
201 | .getCheckerStringOption(C: Checker, OptionName: "IgnoredFilesPattern" ); |
202 | } |
203 | |
204 | bool ento::shouldRegisterCloneChecker(const CheckerManager &mgr) { |
205 | return true; |
206 | } |
207 | |