1 //===- CalledOnceCheck.cpp - Check 'called once' parameters ---------------===//
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
7 //===----------------------------------------------------------------------===//
9 #include "clang/Analysis/Analyses/CalledOnceCheck.h"
10 #include "clang/AST/ASTContext.h"
11 #include "clang/AST/Attr.h"
12 #include "clang/AST/Decl.h"
13 #include "clang/AST/DeclBase.h"
14 #include "clang/AST/Expr.h"
15 #include "clang/AST/ExprObjC.h"
16 #include "clang/AST/OperationKinds.h"
17 #include "clang/AST/ParentMap.h"
18 #include "clang/AST/RecursiveASTVisitor.h"
19 #include "clang/AST/Stmt.h"
20 #include "clang/AST/StmtObjC.h"
21 #include "clang/AST/StmtVisitor.h"
22 #include "clang/AST/Type.h"
23 #include "clang/Analysis/AnalysisDeclContext.h"
24 #include "clang/Analysis/CFG.h"
25 #include "clang/Analysis/FlowSensitive/DataflowWorklist.h"
26 #include "clang/Basic/Builtins.h"
27 #include "clang/Basic/IdentifierTable.h"
28 #include "clang/Basic/LLVM.h"
29 #include "llvm/ADT/BitVector.h"
30 #include "llvm/ADT/BitmaskEnum.h"
31 #include "llvm/ADT/PointerIntPair.h"
32 #include "llvm/ADT/STLExtras.h"
33 #include "llvm/ADT/Sequence.h"
34 #include "llvm/ADT/SmallVector.h"
35 #include "llvm/ADT/StringRef.h"
36 #include "llvm/Support/Casting.h"
37 #include "llvm/Support/Compiler.h"
38 #include "llvm/Support/ErrorHandling.h"
42 using namespace clang
;
45 static constexpr unsigned EXPECTED_MAX_NUMBER_OF_PARAMS
= 2;
47 using ParamSizedVector
= llvm::SmallVector
<T
, EXPECTED_MAX_NUMBER_OF_PARAMS
>;
48 static constexpr unsigned EXPECTED_NUMBER_OF_BASIC_BLOCKS
= 8;
50 using CFGSizedVector
= llvm::SmallVector
<T
, EXPECTED_NUMBER_OF_BASIC_BLOCKS
>;
51 constexpr llvm::StringLiteral CONVENTIONAL_NAMES
[] = {
52 "completionHandler", "completion", "withCompletionHandler",
53 "withCompletion", "completionBlock", "withCompletionBlock",
54 "replyTo", "reply", "withReplyTo"};
55 constexpr llvm::StringLiteral CONVENTIONAL_SUFFIXES
[] = {
56 "WithCompletionHandler", "WithCompletion", "WithCompletionBlock",
57 "WithReplyTo", "WithReply"};
58 constexpr llvm::StringLiteral CONVENTIONAL_CONDITIONS
[] = {
59 "error", "cancel", "shouldCall", "done", "OK", "success"};
61 struct KnownCalledOnceParameter
{
62 llvm::StringLiteral FunctionName
;
65 constexpr KnownCalledOnceParameter KNOWN_CALLED_ONCE_PARAMETERS
[] = {
66 {llvm::StringLiteral
{"dispatch_async"}, 1},
67 {llvm::StringLiteral
{"dispatch_async_and_wait"}, 1},
68 {llvm::StringLiteral
{"dispatch_after"}, 2},
69 {llvm::StringLiteral
{"dispatch_sync"}, 1},
70 {llvm::StringLiteral
{"dispatch_once"}, 1},
71 {llvm::StringLiteral
{"dispatch_barrier_async"}, 1},
72 {llvm::StringLiteral
{"dispatch_barrier_async_and_wait"}, 1},
73 {llvm::StringLiteral
{"dispatch_barrier_sync"}, 1}};
75 class ParameterStatus
{
77 // Status kind is basically the main part of parameter's status.
78 // The kind represents our knowledge (so far) about a tracked parameter
79 // in the context of this analysis.
81 // Since we want to report on missing and extraneous calls, we need to
82 // track the fact whether paramater was called or not. This automatically
83 // decides two kinds: `NotCalled` and `Called`.
85 // One of the erroneous situations is the case when parameter is called only
86 // on some of the paths. We could've considered it `NotCalled`, but we want
87 // to report double call warnings even if these two calls are not guaranteed
88 // to happen in every execution. We also don't want to have it as `Called`
89 // because not calling tracked parameter on all of the paths is an error
90 // on its own. For these reasons, we need to have a separate kind,
91 // `MaybeCalled`, and change `Called` to `DefinitelyCalled` to avoid
94 // Two violations of calling parameter more than once and not calling it on
95 // every path are not, however, mutually exclusive. In situations where both
96 // violations take place, we prefer to report ONLY double call. It's always
97 // harder to pinpoint a bug that has arisen when a user neglects to take the
98 // right action (and therefore, no action is taken), than when a user takes
99 // the wrong action. And, in order to remember that we already reported
100 // a double call, we need another kind: `Reported`.
102 // Our analysis is intra-procedural and, while in the perfect world,
103 // developers only use tracked parameters to call them, in the real world,
104 // the picture might be different. Parameters can be stored in global
105 // variables or leaked into other functions that we know nothing about.
106 // We try to be lenient and trust users. Another kind `Escaped` reflects
107 // such situations. We don't know if it gets called there or not, but we
108 // should always think of `Escaped` as the best possible option.
110 // Some of the paths in the analyzed functions might end with a call
111 // to noreturn functions. Such paths are not required to have parameter
112 // calls and we want to track that. For the purposes of better diagnostics,
113 // we don't want to reuse `Escaped` and, thus, have another kind `NoReturn`.
115 // Additionally, we have `NotVisited` kind that tells us nothing about
116 // a tracked parameter, but is used for tracking analyzed (aka visited)
119 // If we consider `|` to be a JOIN operation of two kinds coming from
120 // two different paths, the following properties must hold:
122 // 1. for any Kind K: K | K == K
123 // Joining two identical kinds should result in the same kind.
125 // 2. for any Kind K: Reported | K == Reported
126 // Doesn't matter on which path it was reported, it still is.
128 // 3. for any Kind K: NoReturn | K == K
129 // We can totally ignore noreturn paths during merges.
131 // 4. DefinitelyCalled | NotCalled == MaybeCalled
132 // Called on one path, not called on another - that's simply
133 // a definition for MaybeCalled.
135 // 5. for any Kind K in [DefinitelyCalled, NotCalled, MaybeCalled]:
137 // Escaped mirrors other statuses after joins.
138 // Every situation, when we join any of the listed kinds K,
139 // is a violation. For this reason, in order to assume the
140 // best outcome for this escape, we consider it to be the
141 // same as the other path.
143 // 6. for any Kind K in [DefinitelyCalled, NotCalled]:
144 // MaybeCalled | K == MaybeCalled
145 // MaybeCalled should basically stay after almost every join.
147 // No-return paths should be absolutely transparent for the analysis.
148 // 0x0 is the identity element for selected join operation (binary or).
149 NoReturn
= 0x0, /* 0000 */
150 // Escaped marks situations when marked parameter escaped into
151 // another function (so we can assume that it was possibly called there).
152 Escaped
= 0x1, /* 0001 */
153 // Parameter was definitely called once at this point.
154 DefinitelyCalled
= 0x3, /* 0011 */
155 // Kinds less or equal to NON_ERROR_STATUS are not considered errors.
156 NON_ERROR_STATUS
= DefinitelyCalled
,
157 // Parameter was not yet called.
158 NotCalled
= 0x5, /* 0101 */
159 // Parameter was not called at least on one path leading to this point,
160 // while there is also at least one path that it gets called.
161 MaybeCalled
= 0x7, /* 0111 */
162 // Parameter was not yet analyzed.
163 NotVisited
= 0x8, /* 1000 */
164 // We already reported a violation and stopped tracking calls for this
166 Reported
= 0x15, /* 1111 */
167 LLVM_MARK_AS_BITMASK_ENUM(/* LargestValue = */ Reported
)
170 constexpr ParameterStatus() = default;
171 /* implicit */ ParameterStatus(Kind K
) : StatusKind(K
) {
172 assert(!seenAnyCalls(K
) && "Can't initialize status without a call");
174 ParameterStatus(Kind K
, const Expr
*Call
) : StatusKind(K
), Call(Call
) {
175 assert(seenAnyCalls(K
) && "This kind is not supposed to have a call");
178 const Expr
&getCall() const {
179 assert(seenAnyCalls(getKind()) && "ParameterStatus doesn't have a call");
182 static bool seenAnyCalls(Kind K
) {
183 return (K
& DefinitelyCalled
) == DefinitelyCalled
&& K
!= Reported
;
185 bool seenAnyCalls() const { return seenAnyCalls(getKind()); }
187 static bool isErrorStatus(Kind K
) { return K
> NON_ERROR_STATUS
; }
188 bool isErrorStatus() const { return isErrorStatus(getKind()); }
190 Kind
getKind() const { return StatusKind
; }
192 void join(const ParameterStatus
&Other
) {
193 // If we have a pointer already, let's keep it.
194 // For the purposes of the analysis, it doesn't really matter
195 // which call we report.
197 // If we don't have a pointer, let's take whatever gets joined.
202 StatusKind
|= Other
.getKind();
205 bool operator==(const ParameterStatus
&Other
) const {
206 // We compare only kinds, pointers on their own is only additional
208 return getKind() == Other
.getKind();
212 // It would've been a perfect place to use llvm::PointerIntPair, but
213 // unfortunately NumLowBitsAvailable for clang::Expr had been reduced to 2.
214 Kind StatusKind
= NotVisited
;
215 const Expr
*Call
= nullptr;
218 /// State aggregates statuses of all tracked parameters.
221 State(unsigned Size
, ParameterStatus::Kind K
= ParameterStatus::NotVisited
)
222 : ParamData(Size
, K
) {}
224 /// Return status of a parameter with the given index.
226 ParameterStatus
&getStatusFor(unsigned Index
) { return ParamData
[Index
]; }
227 const ParameterStatus
&getStatusFor(unsigned Index
) const {
228 return ParamData
[Index
];
232 /// Return true if parameter with the given index can be called.
233 bool seenAnyCalls(unsigned Index
) const {
234 return getStatusFor(Index
).seenAnyCalls();
236 /// Return a reference that we consider a call.
238 /// Should only be used for parameters that can be called.
239 const Expr
&getCallFor(unsigned Index
) const {
240 return getStatusFor(Index
).getCall();
242 /// Return status kind of parameter with the given index.
243 ParameterStatus::Kind
getKindFor(unsigned Index
) const {
244 return getStatusFor(Index
).getKind();
247 bool isVisited() const {
248 return llvm::all_of(ParamData
, [](const ParameterStatus
&S
) {
249 return S
.getKind() != ParameterStatus::NotVisited
;
253 // Join other state into the current state.
254 void join(const State
&Other
) {
255 assert(ParamData
.size() == Other
.ParamData
.size() &&
256 "Couldn't join statuses with different sizes");
257 for (auto Pair
: llvm::zip(ParamData
, Other
.ParamData
)) {
258 std::get
<0>(Pair
).join(std::get
<1>(Pair
));
262 using iterator
= ParamSizedVector
<ParameterStatus
>::iterator
;
263 using const_iterator
= ParamSizedVector
<ParameterStatus
>::const_iterator
;
265 iterator
begin() { return ParamData
.begin(); }
266 iterator
end() { return ParamData
.end(); }
268 const_iterator
begin() const { return ParamData
.begin(); }
269 const_iterator
end() const { return ParamData
.end(); }
271 bool operator==(const State
&Other
) const {
272 return ParamData
== Other
.ParamData
;
276 ParamSizedVector
<ParameterStatus
> ParamData
;
279 /// A simple class that finds DeclRefExpr in the given expression.
281 /// However, we don't want to find ANY nested DeclRefExpr skipping whatever
282 /// expressions on our way. Only certain expressions considered "no-op"
283 /// for our task are indeed skipped.
285 : public ConstStmtVisitor
<DeclRefFinder
, const DeclRefExpr
*> {
287 /// Find a DeclRefExpr in the given expression.
289 /// In its most basic form (ShouldRetrieveFromComparisons == false),
290 /// this function can be simply reduced to the following question:
292 /// - If expression E is used as a function argument, could we say
293 /// that DeclRefExpr nested in E is used as an argument?
295 /// According to this rule, we can say that parens, casts and dereferencing
296 /// (dereferencing only applied to function pointers, but this is our case)
299 /// When we should look into comparisons the question changes to:
301 /// - If expression E is used as a condition, could we say that
302 /// DeclRefExpr is being checked?
304 /// And even though, these are two different questions, they have quite a lot
305 /// in common. Actually, we can say that whatever expression answers
306 /// positively the first question also fits the second question as well.
308 /// In addition, we skip binary operators == and !=, and unary opeartor !.
309 static const DeclRefExpr
*find(const Expr
*E
,
310 bool ShouldRetrieveFromComparisons
= false) {
311 return DeclRefFinder(ShouldRetrieveFromComparisons
).Visit(E
);
314 const DeclRefExpr
*VisitDeclRefExpr(const DeclRefExpr
*DR
) { return DR
; }
316 const DeclRefExpr
*VisitUnaryOperator(const UnaryOperator
*UO
) {
317 switch (UO
->getOpcode()) {
319 // We care about logical not only if we care about comparisons.
320 if (!ShouldRetrieveFromComparisons
)
323 // Function pointer/references can be dereferenced before a call.
324 // That doesn't make it, however, any different from a regular call.
325 // For this reason, dereference operation is a "no-op".
327 return Visit(UO
->getSubExpr());
333 const DeclRefExpr
*VisitBinaryOperator(const BinaryOperator
*BO
) {
334 if (!ShouldRetrieveFromComparisons
)
337 switch (BO
->getOpcode()) {
340 const DeclRefExpr
*LHS
= Visit(BO
->getLHS());
341 return LHS
? LHS
: Visit(BO
->getRHS());
348 const DeclRefExpr
*VisitOpaqueValueExpr(const OpaqueValueExpr
*OVE
) {
349 return Visit(OVE
->getSourceExpr());
352 const DeclRefExpr
*VisitCallExpr(const CallExpr
*CE
) {
353 if (!ShouldRetrieveFromComparisons
)
356 // We want to see through some of the boolean builtin functions
357 // that we are likely to see in conditions.
358 switch (CE
->getBuiltinCallee()) {
359 case Builtin::BI__builtin_expect
:
360 case Builtin::BI__builtin_expect_with_probability
: {
361 assert(CE
->getNumArgs() >= 2);
363 const DeclRefExpr
*Candidate
= Visit(CE
->getArg(0));
364 return Candidate
!= nullptr ? Candidate
: Visit(CE
->getArg(1));
367 case Builtin::BI__builtin_unpredictable
:
368 return Visit(CE
->getArg(0));
375 const DeclRefExpr
*VisitExpr(const Expr
*E
) {
376 // It is a fallback method that gets called whenever the actual type
377 // of the given expression is not covered.
379 // We first check if we have anything to skip. And then repeat the whole
380 // procedure for a nested expression instead.
381 const Expr
*DeclutteredExpr
= E
->IgnoreParenCasts();
382 return E
!= DeclutteredExpr
? Visit(DeclutteredExpr
) : nullptr;
386 DeclRefFinder(bool ShouldRetrieveFromComparisons
)
387 : ShouldRetrieveFromComparisons(ShouldRetrieveFromComparisons
) {}
389 bool ShouldRetrieveFromComparisons
;
392 const DeclRefExpr
*findDeclRefExpr(const Expr
*In
,
393 bool ShouldRetrieveFromComparisons
= false) {
394 return DeclRefFinder::find(In
, ShouldRetrieveFromComparisons
);
398 findReferencedParmVarDecl(const Expr
*In
,
399 bool ShouldRetrieveFromComparisons
= false) {
400 if (const DeclRefExpr
*DR
=
401 findDeclRefExpr(In
, ShouldRetrieveFromComparisons
)) {
402 return dyn_cast
<ParmVarDecl
>(DR
->getDecl());
408 /// Return conditions expression of a statement if it has one.
409 const Expr
*getCondition(const Stmt
*S
) {
414 if (const auto *If
= dyn_cast
<IfStmt
>(S
)) {
415 return If
->getCond();
417 if (const auto *Ternary
= dyn_cast
<AbstractConditionalOperator
>(S
)) {
418 return Ternary
->getCond();
424 /// A small helper class that collects all named identifiers in the given
425 /// expression. It traverses it recursively, so names from deeper levels
426 /// of the AST will end up in the results.
427 /// Results might have duplicate names, if this is a problem, convert to
428 /// string sets afterwards.
429 class NamesCollector
: public RecursiveASTVisitor
<NamesCollector
> {
431 static constexpr unsigned EXPECTED_NUMBER_OF_NAMES
= 5;
432 using NameCollection
=
433 llvm::SmallVector
<llvm::StringRef
, EXPECTED_NUMBER_OF_NAMES
>;
435 static NameCollection
collect(const Expr
*From
) {
437 Impl
.TraverseStmt(const_cast<Expr
*>(From
));
441 bool VisitDeclRefExpr(const DeclRefExpr
*E
) {
442 Result
.push_back(E
->getDecl()->getName());
446 bool VisitObjCPropertyRefExpr(const ObjCPropertyRefExpr
*E
) {
447 llvm::StringRef Name
;
449 if (E
->isImplicitProperty()) {
450 ObjCMethodDecl
*PropertyMethodDecl
= nullptr;
451 if (E
->isMessagingGetter()) {
452 PropertyMethodDecl
= E
->getImplicitPropertyGetter();
454 PropertyMethodDecl
= E
->getImplicitPropertySetter();
456 assert(PropertyMethodDecl
&&
457 "Implicit property must have associated declaration");
458 Name
= PropertyMethodDecl
->getSelector().getNameForSlot(0);
460 assert(E
->isExplicitProperty());
461 Name
= E
->getExplicitProperty()->getName();
464 Result
.push_back(Name
);
469 NamesCollector() = default;
470 NameCollection Result
;
473 /// Check whether the given expression mentions any of conventional names.
474 bool mentionsAnyOfConventionalNames(const Expr
*E
) {
475 NamesCollector::NameCollection MentionedNames
= NamesCollector::collect(E
);
477 return llvm::any_of(MentionedNames
, [](llvm::StringRef ConditionName
) {
479 CONVENTIONAL_CONDITIONS
,
480 [ConditionName
](const llvm::StringLiteral
&Conventional
) {
481 return ConditionName
.contains_insensitive(Conventional
);
486 /// Clarification is a simple pair of a reason why parameter is not called
487 /// on every path and a statement to blame.
488 struct Clarification
{
489 NeverCalledReason Reason
;
490 const Stmt
*Location
;
493 /// A helper class that can produce a clarification based on the given pair
495 class NotCalledClarifier
496 : public ConstStmtVisitor
<NotCalledClarifier
,
497 std::optional
<Clarification
>> {
499 /// The main entrypoint for the class, the function that tries to find the
500 /// clarification of how to explain which sub-path starts with a CFG edge
501 /// from Conditional to SuccWithoutCall.
503 /// This means that this function has one precondition:
504 /// SuccWithoutCall should be a successor block for Conditional.
506 /// Because clarification is not needed for non-trivial pairs of blocks
507 /// (i.e. SuccWithoutCall is not the only successor), it returns meaningful
508 /// results only for such cases. For this very reason, the parent basic
509 /// block, Conditional, is named that way, so it is clear what kind of
510 /// block is expected.
511 static std::optional
<Clarification
> clarify(const CFGBlock
*Conditional
,
512 const CFGBlock
*SuccWithoutCall
) {
513 if (const Stmt
*Terminator
= Conditional
->getTerminatorStmt()) {
514 return NotCalledClarifier
{Conditional
, SuccWithoutCall
}.Visit(Terminator
);
519 std::optional
<Clarification
> VisitIfStmt(const IfStmt
*If
) {
520 return VisitBranchingBlock(If
, NeverCalledReason::IfThen
);
523 std::optional
<Clarification
>
524 VisitAbstractConditionalOperator(const AbstractConditionalOperator
*Ternary
) {
525 return VisitBranchingBlock(Ternary
, NeverCalledReason::IfThen
);
528 std::optional
<Clarification
> VisitSwitchStmt(const SwitchStmt
*Switch
) {
529 const Stmt
*CaseToBlame
= SuccInQuestion
->getLabel();
531 // If interesting basic block is not labeled, it means that this
532 // basic block does not represent any of the cases.
533 return Clarification
{NeverCalledReason::SwitchSkipped
, Switch
};
536 for (const SwitchCase
*Case
= Switch
->getSwitchCaseList(); Case
;
537 Case
= Case
->getNextSwitchCase()) {
538 if (Case
== CaseToBlame
) {
539 return Clarification
{NeverCalledReason::Switch
, Case
};
543 llvm_unreachable("Found unexpected switch structure");
546 std::optional
<Clarification
> VisitForStmt(const ForStmt
*For
) {
547 return VisitBranchingBlock(For
, NeverCalledReason::LoopEntered
);
550 std::optional
<Clarification
> VisitWhileStmt(const WhileStmt
*While
) {
551 return VisitBranchingBlock(While
, NeverCalledReason::LoopEntered
);
554 std::optional
<Clarification
>
555 VisitBranchingBlock(const Stmt
*Terminator
, NeverCalledReason DefaultReason
) {
556 assert(Parent
->succ_size() == 2 &&
557 "Branching block should have exactly two successors");
558 unsigned SuccessorIndex
= getSuccessorIndex(Parent
, SuccInQuestion
);
559 NeverCalledReason ActualReason
=
560 updateForSuccessor(DefaultReason
, SuccessorIndex
);
561 return Clarification
{ActualReason
, Terminator
};
564 std::optional
<Clarification
> VisitBinaryOperator(const BinaryOperator
*) {
565 // We don't want to report on short-curcuit logical operations.
569 std::optional
<Clarification
> VisitStmt(const Stmt
*Terminator
) {
570 // If we got here, we didn't have a visit function for more derived
571 // classes of statement that this terminator actually belongs to.
573 // This is not a good scenario and should not happen in practice, but
574 // at least we'll warn the user.
575 return Clarification
{NeverCalledReason::FallbackReason
, Terminator
};
578 static unsigned getSuccessorIndex(const CFGBlock
*Parent
,
579 const CFGBlock
*Child
) {
580 CFGBlock::const_succ_iterator It
= llvm::find(Parent
->succs(), Child
);
581 assert(It
!= Parent
->succ_end() &&
582 "Given blocks should be in parent-child relationship");
583 return It
- Parent
->succ_begin();
586 static NeverCalledReason
587 updateForSuccessor(NeverCalledReason ReasonForTrueBranch
,
588 unsigned SuccessorIndex
) {
589 assert(SuccessorIndex
<= 1);
591 static_cast<unsigned>(ReasonForTrueBranch
) + SuccessorIndex
;
593 static_cast<unsigned>(NeverCalledReason::LARGEST_VALUE
));
594 return static_cast<NeverCalledReason
>(RawReason
);
598 NotCalledClarifier(const CFGBlock
*Parent
, const CFGBlock
*SuccInQuestion
)
599 : Parent(Parent
), SuccInQuestion(SuccInQuestion
) {}
601 const CFGBlock
*Parent
, *SuccInQuestion
;
604 class CalledOnceChecker
: public ConstStmtVisitor
<CalledOnceChecker
> {
606 static void check(AnalysisDeclContext
&AC
, CalledOnceCheckHandler
&Handler
,
607 bool CheckConventionalParameters
) {
608 CalledOnceChecker(AC
, Handler
, CheckConventionalParameters
).check();
612 CalledOnceChecker(AnalysisDeclContext
&AC
, CalledOnceCheckHandler
&Handler
,
613 bool CheckConventionalParameters
)
614 : FunctionCFG(*AC
.getCFG()), AC(AC
), Handler(Handler
),
615 CheckConventionalParameters(CheckConventionalParameters
),
617 initDataStructures();
618 assert((size() == 0 || !States
.empty()) &&
619 "Data structures are inconsistent");
622 //===----------------------------------------------------------------------===//
623 // Initializing functions
624 //===----------------------------------------------------------------------===//
626 void initDataStructures() {
627 const Decl
*AnalyzedDecl
= AC
.getDecl();
629 if (const auto *Function
= dyn_cast
<FunctionDecl
>(AnalyzedDecl
)) {
630 findParamsToTrack(Function
);
631 } else if (const auto *Method
= dyn_cast
<ObjCMethodDecl
>(AnalyzedDecl
)) {
632 findParamsToTrack(Method
);
633 } else if (const auto *Block
= dyn_cast
<BlockDecl
>(AnalyzedDecl
)) {
634 findCapturesToTrack(Block
);
635 findParamsToTrack(Block
);
638 // Have something to track, let's init states for every block from the CFG.
641 CFGSizedVector
<State
>(FunctionCFG
.getNumBlockIDs(), State(size()));
645 void findCapturesToTrack(const BlockDecl
*Block
) {
646 for (const auto &Capture
: Block
->captures()) {
647 if (const auto *P
= dyn_cast
<ParmVarDecl
>(Capture
.getVariable())) {
648 // Parameter DeclContext is its owning function or method.
649 const DeclContext
*ParamContext
= P
->getDeclContext();
650 if (shouldBeCalledOnce(ParamContext
, P
)) {
651 TrackedParams
.push_back(P
);
657 template <class FunctionLikeDecl
>
658 void findParamsToTrack(const FunctionLikeDecl
*Function
) {
659 for (unsigned Index
: llvm::seq
<unsigned>(0u, Function
->param_size())) {
660 if (shouldBeCalledOnce(Function
, Index
)) {
661 TrackedParams
.push_back(Function
->getParamDecl(Index
));
666 //===----------------------------------------------------------------------===//
667 // Main logic 'check' functions
668 //===----------------------------------------------------------------------===//
671 // Nothing to check here: we don't have marked parameters.
672 if (size() == 0 || isPossiblyEmptyImpl())
676 llvm::none_of(States
, [](const State
&S
) { return S
.isVisited(); }) &&
677 "None of the blocks should be 'visited' before the analysis");
679 // For our task, both backward and forward approaches suite well.
680 // However, in order to report better diagnostics, we decided to go with
681 // backward analysis.
683 // Let's consider the following CFG and how forward and backward analyses
686 // FORWARD: | BACKWARD:
688 // +---------+ | +-----------+
689 // | if | | |MaybeCalled|
690 // +---------+ | +-----------+
691 // |NotCalled| | | if |
692 // +---------+ | +-----------+
694 // #2 / \ #3 | #2 / \ #3
695 // +----------------+ +---------+ | +----------------+ +---------+
696 // | foo() | | ... | | |DefinitelyCalled| |NotCalled|
697 // +----------------+ +---------+ | +----------------+ +---------+
698 // |DefinitelyCalled| |NotCalled| | | foo() | | ... |
699 // +----------------+ +---------+ | +----------------+ +---------+
702 // +-----------+ | +---------+
703 // | ... | | |NotCalled|
704 // +-----------+ | +---------+
705 // |MaybeCalled| | | ... |
706 // +-----------+ | +---------+
708 // The most natural way to report lacking call in the block #3 would be to
709 // message that the false branch of the if statement in the block #1 doesn't
710 // have a call. And while with the forward approach we'll need to find a
711 // least common ancestor or something like that to find the 'if' to blame,
712 // backward analysis gives it to us out of the box.
713 BackwardDataflowWorklist
Worklist(FunctionCFG
, AC
);
716 const CFGBlock
*Exit
= &FunctionCFG
.getExit();
717 assignState(Exit
, State(size(), ParameterStatus::NotCalled
));
718 Worklist
.enqueuePredecessors(Exit
);
720 while (const CFGBlock
*BB
= Worklist
.dequeue()) {
721 assert(BB
&& "Worklist should filter out null blocks");
723 assert(CurrentState
.isVisited() &&
724 "After the check, basic block should be visited");
726 // Traverse successor basic blocks if the status of this block
728 if (assignState(BB
, CurrentState
)) {
729 Worklist
.enqueuePredecessors(BB
);
733 // Check that we have all tracked parameters at the last block.
734 // As we are performing a backward version of the analysis,
735 // it should be the ENTRY block.
736 checkEntry(&FunctionCFG
.getEntry());
739 void check(const CFGBlock
*BB
) {
740 // We start with a state 'inherited' from all the successors.
741 CurrentState
= joinSuccessors(BB
);
742 assert(CurrentState
.isVisited() &&
743 "Shouldn't start with a 'not visited' state");
745 // This is the 'exit' situation, broken promises are probably OK
746 // in such scenarios.
747 if (BB
->hasNoReturnElement()) {
749 // This block still can have calls (even multiple calls) and
750 // for this reason there is no early return here.
753 // We use a backward dataflow propagation and for this reason we
754 // should traverse basic blocks bottom-up.
755 for (const CFGElement
&Element
: llvm::reverse(*BB
)) {
756 if (std::optional
<CFGStmt
> S
= Element
.getAs
<CFGStmt
>()) {
761 void check(const Stmt
*S
) { Visit(S
); }
763 void checkEntry(const CFGBlock
*Entry
) {
764 // We finalize this algorithm with the ENTRY block because
765 // we use a backward version of the analysis. This is where
766 // we can judge that some of the tracked parameters are not called on
767 // every path from ENTRY to EXIT.
769 const State
&EntryStatus
= getState(Entry
);
770 llvm::BitVector
NotCalledOnEveryPath(size(), false);
771 llvm::BitVector
NotUsedOnEveryPath(size(), false);
773 // Check if there are no calls of the marked parameter at all
774 for (const auto &IndexedStatus
: llvm::enumerate(EntryStatus
)) {
775 const ParmVarDecl
*Parameter
= getParameter(IndexedStatus
.index());
777 switch (IndexedStatus
.value().getKind()) {
778 case ParameterStatus::NotCalled
:
779 // If there were places where this parameter escapes (aka being used),
780 // we can provide a more useful diagnostic by pointing at the exact
781 // branches where it is not even mentioned.
782 if (!hasEverEscaped(IndexedStatus
.index())) {
783 // This parameter is was not used at all, so we should report the
784 // most generic version of the warning.
785 if (isCaptured(Parameter
)) {
786 // We want to specify that it was captured by the block.
787 Handler
.handleCapturedNeverCalled(Parameter
, AC
.getDecl(),
788 !isExplicitlyMarked(Parameter
));
790 Handler
.handleNeverCalled(Parameter
,
791 !isExplicitlyMarked(Parameter
));
794 // Mark it as 'interesting' to figure out which paths don't even
796 NotUsedOnEveryPath
[IndexedStatus
.index()] = true;
800 case ParameterStatus::MaybeCalled
:
801 // If we have 'maybe called' at this point, we have an error
802 // that there is at least one path where this parameter
805 // However, reporting the warning with only that information can be
806 // too vague for the users. For this reason, we mark such parameters
807 // as "interesting" for further analysis.
808 NotCalledOnEveryPath
[IndexedStatus
.index()] = true;
815 // Early exit if we don't have parameters for extra analysis...
816 if (NotCalledOnEveryPath
.none() && NotUsedOnEveryPath
.none() &&
817 // ... or if we've seen variables with cleanup functions.
818 // We can't reason that we've seen every path in this case,
819 // and thus abandon reporting any warnings that imply that.
820 !FunctionHasCleanupVars
)
823 // We are looking for a pair of blocks A, B so that the following is true:
824 // * A is a predecessor of B
825 // * B is marked as NotCalled
826 // * A has at least one successor marked as either
827 // Escaped or DefinitelyCalled
829 // In that situation, it is guaranteed that B is the first block of the path
830 // where the user doesn't call or use parameter in question.
832 // For this reason, branch A -> B can be used for reporting.
834 // This part of the algorithm is guarded by a condition that the function
835 // does indeed have a violation of contract. For this reason, we can
836 // spend more time to find a good spot to place the warning.
838 // The following algorithm has the worst case complexity of O(V + E),
839 // where V is the number of basic blocks in FunctionCFG,
840 // E is the number of edges between blocks in FunctionCFG.
841 for (const CFGBlock
*BB
: FunctionCFG
) {
845 const State
&BlockState
= getState(BB
);
847 for (unsigned Index
: llvm::seq(0u, size())) {
848 // We don't want to use 'isLosingCall' here because we want to report
849 // the following situation as well:
853 // MaybeCalled NotCalled
855 // Even though successor is not 'DefinitelyCalled', it is still useful
856 // to report it, it is still a path without a call.
857 if (NotCalledOnEveryPath
[Index
] &&
858 BlockState
.getKindFor(Index
) == ParameterStatus::MaybeCalled
) {
860 findAndReportNotCalledBranches(BB
, Index
);
861 } else if (NotUsedOnEveryPath
[Index
] &&
862 isLosingEscape(BlockState
, BB
, Index
)) {
864 findAndReportNotCalledBranches(BB
, Index
, /* IsEscape = */ true);
870 /// Check potential call of a tracked parameter.
871 void checkDirectCall(const CallExpr
*Call
) {
872 if (auto Index
= getIndexOfCallee(Call
)) {
873 processCallFor(*Index
, Call
);
877 /// Check the call expression for being an indirect call of one of the tracked
878 /// parameters. It is indirect in the sense that this particular call is not
879 /// calling the parameter itself, but rather uses it as the argument.
880 template <class CallLikeExpr
>
881 void checkIndirectCall(const CallLikeExpr
*CallOrMessage
) {
882 // CallExpr::arguments does not interact nicely with llvm::enumerate.
883 llvm::ArrayRef
<const Expr
*> Arguments
=
884 llvm::ArrayRef(CallOrMessage
->getArgs(), CallOrMessage
->getNumArgs());
886 // Let's check if any of the call arguments is a point of interest.
887 for (const auto &Argument
: llvm::enumerate(Arguments
)) {
888 if (auto Index
= getIndexOfExpression(Argument
.value())) {
889 if (shouldBeCalledOnce(CallOrMessage
, Argument
.index())) {
890 // If the corresponding parameter is marked as 'called_once' we should
891 // consider it as a call.
892 processCallFor(*Index
, CallOrMessage
);
894 // Otherwise, we mark this parameter as escaped, which can be
895 // interpreted both as called or not called depending on the context.
896 processEscapeFor(*Index
);
898 // Otherwise, let's keep the state as it is.
903 /// Process call of the parameter with the given index
904 void processCallFor(unsigned Index
, const Expr
*Call
) {
905 ParameterStatus
&CurrentParamStatus
= CurrentState
.getStatusFor(Index
);
907 if (CurrentParamStatus
.seenAnyCalls()) {
909 // At this point, this parameter was called, so this is a second call.
910 const ParmVarDecl
*Parameter
= getParameter(Index
);
911 Handler
.handleDoubleCall(
912 Parameter
, &CurrentState
.getCallFor(Index
), Call
,
913 !isExplicitlyMarked(Parameter
),
914 // We are sure that the second call is definitely
915 // going to happen if the status is 'DefinitelyCalled'.
916 CurrentParamStatus
.getKind() == ParameterStatus::DefinitelyCalled
);
918 // Mark this parameter as already reported on, so we don't repeat
920 CurrentParamStatus
= ParameterStatus::Reported
;
922 } else if (CurrentParamStatus
.getKind() != ParameterStatus::Reported
) {
923 // If we didn't report anything yet, let's mark this parameter
925 ParameterStatus
Called(ParameterStatus::DefinitelyCalled
, Call
);
926 CurrentParamStatus
= Called
;
930 /// Process escape of the parameter with the given index
931 void processEscapeFor(unsigned Index
) {
932 ParameterStatus
&CurrentParamStatus
= CurrentState
.getStatusFor(Index
);
934 // Escape overrides whatever error we think happened.
935 if (CurrentParamStatus
.isErrorStatus()) {
936 CurrentParamStatus
= ParameterStatus::Escaped
;
940 void findAndReportNotCalledBranches(const CFGBlock
*Parent
, unsigned Index
,
941 bool IsEscape
= false) {
942 for (const CFGBlock
*Succ
: Parent
->succs()) {
946 if (getState(Succ
).getKindFor(Index
) == ParameterStatus::NotCalled
) {
947 assert(Parent
->succ_size() >= 2 &&
948 "Block should have at least two successors at this point");
949 if (auto Clarification
= NotCalledClarifier::clarify(Parent
, Succ
)) {
950 const ParmVarDecl
*Parameter
= getParameter(Index
);
951 Handler
.handleNeverCalled(
952 Parameter
, AC
.getDecl(), Clarification
->Location
,
953 Clarification
->Reason
, !IsEscape
, !isExplicitlyMarked(Parameter
));
959 //===----------------------------------------------------------------------===//
960 // Predicate functions to check parameters
961 //===----------------------------------------------------------------------===//
963 /// Return true if parameter is explicitly marked as 'called_once'.
964 static bool isExplicitlyMarked(const ParmVarDecl
*Parameter
) {
965 return Parameter
->hasAttr
<CalledOnceAttr
>();
968 /// Return true if the given name matches conventional pattens.
969 static bool isConventional(llvm::StringRef Name
) {
970 return llvm::count(CONVENTIONAL_NAMES
, Name
) != 0;
973 /// Return true if the given name has conventional suffixes.
974 static bool hasConventionalSuffix(llvm::StringRef Name
) {
975 return llvm::any_of(CONVENTIONAL_SUFFIXES
, [Name
](llvm::StringRef Suffix
) {
976 return Name
.ends_with(Suffix
);
980 /// Return true if the given type can be used for conventional parameters.
981 static bool isConventional(QualType Ty
) {
982 if (!Ty
->isBlockPointerType()) {
986 QualType BlockType
= Ty
->castAs
<BlockPointerType
>()->getPointeeType();
987 // Completion handlers should have a block type with void return type.
988 return BlockType
->castAs
<FunctionType
>()->getReturnType()->isVoidType();
991 /// Return true if the only parameter of the function is conventional.
992 static bool isOnlyParameterConventional(const FunctionDecl
*Function
) {
993 IdentifierInfo
*II
= Function
->getIdentifier();
994 return Function
->getNumParams() == 1 && II
&&
995 hasConventionalSuffix(II
->getName());
998 /// Return true/false if 'swift_async' attribute states that the given
999 /// parameter is conventionally called once.
1000 /// Return std::nullopt if the given declaration doesn't have 'swift_async'
1002 static std::optional
<bool> isConventionalSwiftAsync(const Decl
*D
,
1003 unsigned ParamIndex
) {
1004 if (const SwiftAsyncAttr
*A
= D
->getAttr
<SwiftAsyncAttr
>()) {
1005 if (A
->getKind() == SwiftAsyncAttr::None
) {
1009 return A
->getCompletionHandlerIndex().getASTIndex() == ParamIndex
;
1011 return std::nullopt
;
1014 /// Return true if the specified selector represents init method.
1015 static bool isInitMethod(Selector MethodSelector
) {
1016 return MethodSelector
.getMethodFamily() == OMF_init
;
1019 /// Return true if the specified selector piece matches conventions.
1020 static bool isConventionalSelectorPiece(Selector MethodSelector
,
1021 unsigned PieceIndex
,
1022 QualType PieceType
) {
1023 if (!isConventional(PieceType
) || isInitMethod(MethodSelector
)) {
1027 if (MethodSelector
.getNumArgs() == 1) {
1028 assert(PieceIndex
== 0);
1029 return hasConventionalSuffix(MethodSelector
.getNameForSlot(0));
1032 llvm::StringRef PieceName
= MethodSelector
.getNameForSlot(PieceIndex
);
1033 return isConventional(PieceName
) || hasConventionalSuffix(PieceName
);
1036 bool shouldBeCalledOnce(const ParmVarDecl
*Parameter
) const {
1037 return isExplicitlyMarked(Parameter
) ||
1038 (CheckConventionalParameters
&&
1039 (isConventional(Parameter
->getName()) ||
1040 hasConventionalSuffix(Parameter
->getName())) &&
1041 isConventional(Parameter
->getType()));
1044 bool shouldBeCalledOnce(const DeclContext
*ParamContext
,
1045 const ParmVarDecl
*Param
) {
1046 unsigned ParamIndex
= Param
->getFunctionScopeIndex();
1047 if (const auto *Function
= dyn_cast
<FunctionDecl
>(ParamContext
)) {
1048 return shouldBeCalledOnce(Function
, ParamIndex
);
1050 if (const auto *Method
= dyn_cast
<ObjCMethodDecl
>(ParamContext
)) {
1051 return shouldBeCalledOnce(Method
, ParamIndex
);
1053 return shouldBeCalledOnce(Param
);
1056 bool shouldBeCalledOnce(const BlockDecl
*Block
, unsigned ParamIndex
) const {
1057 return shouldBeCalledOnce(Block
->getParamDecl(ParamIndex
));
1060 bool shouldBeCalledOnce(const FunctionDecl
*Function
,
1061 unsigned ParamIndex
) const {
1062 if (ParamIndex
>= Function
->getNumParams()) {
1065 // 'swift_async' goes first and overrides anything else.
1066 if (auto ConventionalAsync
=
1067 isConventionalSwiftAsync(Function
, ParamIndex
)) {
1068 return *ConventionalAsync
;
1071 return shouldBeCalledOnce(Function
->getParamDecl(ParamIndex
)) ||
1072 (CheckConventionalParameters
&&
1073 isOnlyParameterConventional(Function
));
1076 bool shouldBeCalledOnce(const ObjCMethodDecl
*Method
,
1077 unsigned ParamIndex
) const {
1078 Selector MethodSelector
= Method
->getSelector();
1079 if (ParamIndex
>= MethodSelector
.getNumArgs()) {
1083 // 'swift_async' goes first and overrides anything else.
1084 if (auto ConventionalAsync
= isConventionalSwiftAsync(Method
, ParamIndex
)) {
1085 return *ConventionalAsync
;
1088 const ParmVarDecl
*Parameter
= Method
->getParamDecl(ParamIndex
);
1089 return shouldBeCalledOnce(Parameter
) ||
1090 (CheckConventionalParameters
&&
1091 isConventionalSelectorPiece(MethodSelector
, ParamIndex
,
1092 Parameter
->getType()));
1095 bool shouldBeCalledOnce(const CallExpr
*Call
, unsigned ParamIndex
) const {
1096 const FunctionDecl
*Function
= Call
->getDirectCallee();
1097 return Function
&& shouldBeCalledOnce(Function
, ParamIndex
);
1100 bool shouldBeCalledOnce(const ObjCMessageExpr
*Message
,
1101 unsigned ParamIndex
) const {
1102 const ObjCMethodDecl
*Method
= Message
->getMethodDecl();
1103 return Method
&& ParamIndex
< Method
->param_size() &&
1104 shouldBeCalledOnce(Method
, ParamIndex
);
1107 //===----------------------------------------------------------------------===//
1109 //===----------------------------------------------------------------------===//
1111 bool isCaptured(const ParmVarDecl
*Parameter
) const {
1112 if (const BlockDecl
*Block
= dyn_cast
<BlockDecl
>(AC
.getDecl())) {
1113 return Block
->capturesVariable(Parameter
);
1118 // Return a call site where the block is called exactly once or null otherwise
1119 const Expr
*getBlockGuaraneedCallSite(const BlockExpr
*Block
) const {
1120 ParentMap
&PM
= AC
.getParentMap();
1122 // We don't want to track the block through assignments and so on, instead
1123 // we simply see how the block used and if it's used directly in a call,
1124 // we decide based on call to what it is.
1126 // In order to do this, we go up the parents of the block looking for
1127 // a call or a message expressions. These might not be immediate parents
1128 // of the actual block expression due to casts and parens, so we skip them.
1129 for (const Stmt
*Prev
= Block
, *Current
= PM
.getParent(Block
);
1130 Current
!= nullptr; Prev
= Current
, Current
= PM
.getParent(Current
)) {
1131 // Skip no-op (for our case) operations.
1132 if (isa
<CastExpr
>(Current
) || isa
<ParenExpr
>(Current
))
1135 // At this point, Prev represents our block as an immediate child of the
1137 if (const auto *Call
= dyn_cast
<CallExpr
>(Current
)) {
1138 // It might be the call of the Block itself...
1139 if (Call
->getCallee() == Prev
)
1142 // ...or it can be an indirect call of the block.
1143 return shouldBlockArgumentBeCalledOnce(Call
, Prev
) ? Call
: nullptr;
1145 if (const auto *Message
= dyn_cast
<ObjCMessageExpr
>(Current
)) {
1146 return shouldBlockArgumentBeCalledOnce(Message
, Prev
) ? Message
1156 template <class CallLikeExpr
>
1157 bool shouldBlockArgumentBeCalledOnce(const CallLikeExpr
*CallOrMessage
,
1158 const Stmt
*BlockArgument
) const {
1159 // CallExpr::arguments does not interact nicely with llvm::enumerate.
1160 llvm::ArrayRef
<const Expr
*> Arguments
=
1161 llvm::ArrayRef(CallOrMessage
->getArgs(), CallOrMessage
->getNumArgs());
1163 for (const auto &Argument
: llvm::enumerate(Arguments
)) {
1164 if (Argument
.value() == BlockArgument
) {
1165 return shouldBlockArgumentBeCalledOnce(CallOrMessage
, Argument
.index());
1172 bool shouldBlockArgumentBeCalledOnce(const CallExpr
*Call
,
1173 unsigned ParamIndex
) const {
1174 const FunctionDecl
*Function
= Call
->getDirectCallee();
1175 return shouldBlockArgumentBeCalledOnce(Function
, ParamIndex
) ||
1176 shouldBeCalledOnce(Call
, ParamIndex
);
1179 bool shouldBlockArgumentBeCalledOnce(const ObjCMessageExpr
*Message
,
1180 unsigned ParamIndex
) const {
1181 // At the moment, we don't have any Obj-C methods we want to specifically
1183 return shouldBeCalledOnce(Message
, ParamIndex
);
1186 static bool shouldBlockArgumentBeCalledOnce(const FunctionDecl
*Function
,
1187 unsigned ParamIndex
) {
1188 // There is a list of important API functions that while not following
1189 // conventions nor being directly annotated, still guarantee that the
1190 // callback parameter will be called exactly once.
1192 // Here we check if this is the case.
1194 llvm::any_of(KNOWN_CALLED_ONCE_PARAMETERS
,
1195 [Function
, ParamIndex
](
1196 const KnownCalledOnceParameter
&Reference
) {
1197 return Reference
.FunctionName
==
1198 Function
->getName() &&
1199 Reference
.ParamIndex
== ParamIndex
;
1203 /// Return true if the analyzed function is actually a default implementation
1204 /// of the method that has to be overriden.
1206 /// These functions can have tracked parameters, but wouldn't call them
1207 /// because they are not designed to perform any meaningful actions.
1209 /// There are a couple of flavors of such default implementations:
1210 /// 1. Empty methods or methods with a single return statement
1211 /// 2. Methods that have one block with a call to no return function
1212 /// 3. Methods with only assertion-like operations
1213 bool isPossiblyEmptyImpl() const {
1214 if (!isa
<ObjCMethodDecl
>(AC
.getDecl())) {
1215 // We care only about functions that are not supposed to be called.
1216 // Only methods can be overriden.
1220 // Case #1 (without return statements)
1221 if (FunctionCFG
.size() == 2) {
1222 // Method has only two blocks: ENTRY and EXIT.
1223 // This is equivalent to empty function.
1228 if (FunctionCFG
.size() == 3) {
1229 const CFGBlock
&Entry
= FunctionCFG
.getEntry();
1230 if (Entry
.succ_empty()) {
1234 const CFGBlock
*OnlyBlock
= *Entry
.succ_begin();
1235 // Method has only one block, let's see if it has a no-return
1237 if (OnlyBlock
&& OnlyBlock
->hasNoReturnElement()) {
1240 // Fallthrough, CFGs with only one block can fall into #1 and #3 as well.
1243 // Cases #1 (return statements) and #3.
1245 // It is hard to detect that something is an assertion or came
1246 // from assertion. Here we use a simple heuristic:
1248 // - If it came from a macro, it can be an assertion.
1250 // Additionally, we can't assume a number of basic blocks or the CFG's
1251 // structure because assertions might include loops and conditions.
1252 return llvm::all_of(FunctionCFG
, [](const CFGBlock
*BB
) {
1254 // Unreachable blocks are totally fine.
1258 // Return statements can have sub-expressions that are represented as
1259 // separate statements of a basic block. We should allow this.
1260 // This parent map will be initialized with a parent tree for all
1261 // subexpressions of the block's return statement (if it has one).
1262 std::unique_ptr
<ParentMap
> ReturnChildren
;
1264 return llvm::all_of(
1265 llvm::reverse(*BB
), // we should start with return statements, if we
1266 // have any, i.e. from the bottom of the block
1267 [&ReturnChildren
](const CFGElement
&Element
) {
1268 if (std::optional
<CFGStmt
> S
= Element
.getAs
<CFGStmt
>()) {
1269 const Stmt
*SuspiciousStmt
= S
->getStmt();
1271 if (isa
<ReturnStmt
>(SuspiciousStmt
)) {
1272 // Let's initialize this structure to test whether
1273 // some further statement is a part of this return.
1274 ReturnChildren
= std::make_unique
<ParentMap
>(
1275 const_cast<Stmt
*>(SuspiciousStmt
));
1276 // Return statements are allowed as part of #1.
1280 return SuspiciousStmt
->getBeginLoc().isMacroID() ||
1282 ReturnChildren
->hasParent(SuspiciousStmt
));
1289 /// Check if parameter with the given index has ever escaped.
1290 bool hasEverEscaped(unsigned Index
) const {
1291 return llvm::any_of(States
, [Index
](const State
&StateForOneBB
) {
1292 return StateForOneBB
.getKindFor(Index
) == ParameterStatus::Escaped
;
1296 /// Return status stored for the given basic block.
1298 State
&getState(const CFGBlock
*BB
) {
1300 return States
[BB
->getBlockID()];
1302 const State
&getState(const CFGBlock
*BB
) const {
1304 return States
[BB
->getBlockID()];
1308 /// Assign status to the given basic block.
1310 /// Returns true when the stored status changed.
1311 bool assignState(const CFGBlock
*BB
, const State
&ToAssign
) {
1312 State
&Current
= getState(BB
);
1313 if (Current
== ToAssign
) {
1321 /// Join all incoming statuses for the given basic block.
1322 State
joinSuccessors(const CFGBlock
*BB
) const {
1324 llvm::make_filter_range(BB
->succs(), [this](const CFGBlock
*Succ
) {
1325 return Succ
&& this->getState(Succ
).isVisited();
1327 // We came to this block from somewhere after all.
1328 assert(!Succs
.empty() &&
1329 "Basic block should have at least one visited successor");
1331 State Result
= getState(*Succs
.begin());
1333 for (const CFGBlock
*Succ
: llvm::drop_begin(Succs
, 1)) {
1334 Result
.join(getState(Succ
));
1337 if (const Expr
*Condition
= getCondition(BB
->getTerminatorStmt())) {
1338 handleConditional(BB
, Condition
, Result
);
1344 void handleConditional(const CFGBlock
*BB
, const Expr
*Condition
,
1345 State
&ToAlter
) const {
1346 handleParameterCheck(BB
, Condition
, ToAlter
);
1347 if (SuppressOnConventionalErrorPaths
) {
1348 handleConventionalCheck(BB
, Condition
, ToAlter
);
1352 void handleParameterCheck(const CFGBlock
*BB
, const Expr
*Condition
,
1353 State
&ToAlter
) const {
1354 // In this function, we try to deal with the following pattern:
1359 // It's not good to show a warning here because clearly 'parameter'
1360 // couldn't and shouldn't be called on the 'else' path.
1362 // Let's check if this if statement has a check involving one of
1363 // the tracked parameters.
1364 if (const ParmVarDecl
*Parameter
= findReferencedParmVarDecl(
1366 /* ShouldRetrieveFromComparisons = */ true)) {
1367 if (const auto Index
= getIndex(*Parameter
)) {
1368 ParameterStatus
&CurrentStatus
= ToAlter
.getStatusFor(*Index
);
1370 // We don't want to deep dive into semantics of the check and
1371 // figure out if that check was for null or something else.
1372 // We simply trust the user that they know what they are doing.
1374 // For this reason, in the following loop we look for the
1375 // best-looking option.
1376 for (const CFGBlock
*Succ
: BB
->succs()) {
1380 const ParameterStatus
&StatusInSucc
=
1381 getState(Succ
).getStatusFor(*Index
);
1383 if (StatusInSucc
.isErrorStatus()) {
1387 // Let's use this status instead.
1388 CurrentStatus
= StatusInSucc
;
1390 if (StatusInSucc
.getKind() == ParameterStatus::DefinitelyCalled
) {
1391 // This is the best option to have and we already found it.
1395 // If we found 'Escaped' first, we still might find 'DefinitelyCalled'
1396 // on the other branch. And we prefer the latter.
1402 void handleConventionalCheck(const CFGBlock
*BB
, const Expr
*Condition
,
1403 State
&ToAlter
) const {
1404 // Even when the analysis is technically correct, it is a widespread pattern
1405 // not to call completion handlers in some scenarios. These usually have
1406 // typical conditional names, such as 'error' or 'cancel'.
1407 if (!mentionsAnyOfConventionalNames(Condition
)) {
1411 for (const auto &IndexedStatus
: llvm::enumerate(ToAlter
)) {
1412 const ParmVarDecl
*Parameter
= getParameter(IndexedStatus
.index());
1413 // Conventions do not apply to explicitly marked parameters.
1414 if (isExplicitlyMarked(Parameter
)) {
1418 ParameterStatus
&CurrentStatus
= IndexedStatus
.value();
1419 // If we did find that on one of the branches the user uses the callback
1420 // and doesn't on the other path, we believe that they know what they are
1421 // doing and trust them.
1423 // There are two possible scenarios for that:
1424 // 1. Current status is 'MaybeCalled' and one of the branches is
1425 // 'DefinitelyCalled'
1426 // 2. Current status is 'NotCalled' and one of the branches is 'Escaped'
1427 if (isLosingCall(ToAlter
, BB
, IndexedStatus
.index()) ||
1428 isLosingEscape(ToAlter
, BB
, IndexedStatus
.index())) {
1429 CurrentStatus
= ParameterStatus::Escaped
;
1434 bool isLosingCall(const State
&StateAfterJoin
, const CFGBlock
*JoinBlock
,
1435 unsigned ParameterIndex
) const {
1436 // Let's check if the block represents DefinitelyCalled -> MaybeCalled
1438 return isLosingJoin(StateAfterJoin
, JoinBlock
, ParameterIndex
,
1439 ParameterStatus::MaybeCalled
,
1440 ParameterStatus::DefinitelyCalled
);
1443 bool isLosingEscape(const State
&StateAfterJoin
, const CFGBlock
*JoinBlock
,
1444 unsigned ParameterIndex
) const {
1445 // Let's check if the block represents Escaped -> NotCalled transition.
1446 return isLosingJoin(StateAfterJoin
, JoinBlock
, ParameterIndex
,
1447 ParameterStatus::NotCalled
, ParameterStatus::Escaped
);
1450 bool isLosingJoin(const State
&StateAfterJoin
, const CFGBlock
*JoinBlock
,
1451 unsigned ParameterIndex
, ParameterStatus::Kind AfterJoin
,
1452 ParameterStatus::Kind BeforeJoin
) const {
1453 assert(!ParameterStatus::isErrorStatus(BeforeJoin
) &&
1454 ParameterStatus::isErrorStatus(AfterJoin
) &&
1455 "It's not a losing join if statuses do not represent "
1456 "correct-to-error transition");
1458 const ParameterStatus
&CurrentStatus
=
1459 StateAfterJoin
.getStatusFor(ParameterIndex
);
1461 return CurrentStatus
.getKind() == AfterJoin
&&
1462 anySuccessorHasStatus(JoinBlock
, ParameterIndex
, BeforeJoin
);
1465 /// Return true if any of the successors of the given basic block has
1466 /// a specified status for the given parameter.
1467 bool anySuccessorHasStatus(const CFGBlock
*Parent
, unsigned ParameterIndex
,
1468 ParameterStatus::Kind ToFind
) const {
1469 return llvm::any_of(
1470 Parent
->succs(), [this, ParameterIndex
, ToFind
](const CFGBlock
*Succ
) {
1471 return Succ
&& getState(Succ
).getKindFor(ParameterIndex
) == ToFind
;
1475 /// Check given expression that was discovered to escape.
1476 void checkEscapee(const Expr
*E
) {
1477 if (const ParmVarDecl
*Parameter
= findReferencedParmVarDecl(E
)) {
1478 checkEscapee(*Parameter
);
1482 /// Check given parameter that was discovered to escape.
1483 void checkEscapee(const ParmVarDecl
&Parameter
) {
1484 if (auto Index
= getIndex(Parameter
)) {
1485 processEscapeFor(*Index
);
1489 /// Mark all parameters in the current state as 'no-return'.
1490 void markNoReturn() {
1491 for (ParameterStatus
&PS
: CurrentState
) {
1492 PS
= ParameterStatus::NoReturn
;
1496 /// Check if the given assignment represents suppression and act on it.
1497 void checkSuppression(const BinaryOperator
*Assignment
) {
1498 // Suppression has the following form:
1500 // 0 can be of any form (NULL, nil, etc.)
1501 if (auto Index
= getIndexOfExpression(Assignment
->getLHS())) {
1503 // We don't care what is written in the RHS, it could be whatever
1504 // we can interpret as 0.
1506 Assignment
->getRHS()->IgnoreParenCasts()->getIntegerConstantExpr(
1507 AC
.getASTContext())) {
1509 ParameterStatus
&CurrentParamStatus
= CurrentState
.getStatusFor(*Index
);
1511 if (0 == *Constant
&& CurrentParamStatus
.seenAnyCalls()) {
1512 // Even though this suppression mechanism is introduced to tackle
1513 // false positives for multiple calls, the fact that the user has
1514 // to use suppression can also tell us that we couldn't figure out
1515 // how different paths cancel each other out. And if that is true,
1516 // we will most certainly have false positives about parameters not
1517 // being called on certain paths.
1519 // For this reason, we abandon tracking this parameter altogether.
1520 CurrentParamStatus
= ParameterStatus::Reported
;
1527 //===----------------------------------------------------------------------===//
1528 // Tree traversal methods
1529 //===----------------------------------------------------------------------===//
1531 void VisitCallExpr(const CallExpr
*Call
) {
1532 // This call might be a direct call, i.e. a parameter call...
1533 checkDirectCall(Call
);
1534 // ... or an indirect call, i.e. when parameter is an argument.
1535 checkIndirectCall(Call
);
1538 void VisitObjCMessageExpr(const ObjCMessageExpr
*Message
) {
1539 // The most common situation that we are defending against here is
1540 // copying a tracked parameter.
1541 if (const Expr
*Receiver
= Message
->getInstanceReceiver()) {
1542 checkEscapee(Receiver
);
1544 // Message expressions unlike calls, could not be direct.
1545 checkIndirectCall(Message
);
1548 void VisitBlockExpr(const BlockExpr
*Block
) {
1549 // Block expressions are tricky. It is a very common practice to capture
1550 // completion handlers by blocks and use them there.
1551 // For this reason, it is important to analyze blocks and report warnings
1552 // for completion handler misuse in blocks.
1554 // However, it can be quite difficult to track how the block itself is being
1555 // used. The full precise anlysis of that will be similar to alias analysis
1556 // for completion handlers and can be too heavyweight for a compile-time
1557 // diagnostic. Instead, we judge about the immediate use of the block.
1559 // Here, we try to find a call expression where we know due to conventions,
1560 // annotations, or other reasons that the block is called once and only
1562 const Expr
*CalledOnceCallSite
= getBlockGuaraneedCallSite(Block
);
1564 // We need to report this information to the handler because in the
1565 // situation when we know that the block is called exactly once, we can be
1566 // stricter in terms of reported diagnostics.
1567 if (CalledOnceCallSite
) {
1568 Handler
.handleBlockThatIsGuaranteedToBeCalledOnce(Block
->getBlockDecl());
1570 Handler
.handleBlockWithNoGuarantees(Block
->getBlockDecl());
1573 for (const auto &Capture
: Block
->getBlockDecl()->captures()) {
1574 if (const auto *Param
= dyn_cast
<ParmVarDecl
>(Capture
.getVariable())) {
1575 if (auto Index
= getIndex(*Param
)) {
1576 if (CalledOnceCallSite
) {
1577 // The call site of a block can be considered a call site of the
1578 // captured parameter we track.
1579 processCallFor(*Index
, CalledOnceCallSite
);
1581 // We still should consider this block as an escape for parameter,
1582 // if we don't know about its call site or the number of time it
1584 processEscapeFor(*Index
);
1591 void VisitBinaryOperator(const BinaryOperator
*Op
) {
1592 if (Op
->getOpcode() == clang::BO_Assign
) {
1593 // Let's check if one of the tracked parameters is assigned into
1594 // something, and if it is we don't want to track extra variables, so we
1595 // consider it as an escapee.
1596 checkEscapee(Op
->getRHS());
1598 // Let's check whether this assignment is a suppression.
1599 checkSuppression(Op
);
1603 void VisitDeclStmt(const DeclStmt
*DS
) {
1604 // Variable initialization is not assignment and should be handled
1607 // Multiple declarations can be a part of declaration statement.
1608 for (const auto *Declaration
: DS
->getDeclGroup()) {
1609 if (const auto *Var
= dyn_cast
<VarDecl
>(Declaration
)) {
1610 if (Var
->getInit()) {
1611 checkEscapee(Var
->getInit());
1614 if (Var
->hasAttr
<CleanupAttr
>()) {
1615 FunctionHasCleanupVars
= true;
1621 void VisitCStyleCastExpr(const CStyleCastExpr
*Cast
) {
1622 // We consider '(void)parameter' as a manual no-op escape.
1623 // It should be used to explicitly tell the analysis that this parameter
1624 // is intentionally not called on this path.
1625 if (Cast
->getType().getCanonicalType()->isVoidType()) {
1626 checkEscapee(Cast
->getSubExpr());
1630 void VisitObjCAtThrowStmt(const ObjCAtThrowStmt
*) {
1631 // It is OK not to call marked parameters on exceptional paths.
1636 unsigned size() const { return TrackedParams
.size(); }
1638 std::optional
<unsigned> getIndexOfCallee(const CallExpr
*Call
) const {
1639 return getIndexOfExpression(Call
->getCallee());
1642 std::optional
<unsigned> getIndexOfExpression(const Expr
*E
) const {
1643 if (const ParmVarDecl
*Parameter
= findReferencedParmVarDecl(E
)) {
1644 return getIndex(*Parameter
);
1647 return std::nullopt
;
1650 std::optional
<unsigned> getIndex(const ParmVarDecl
&Parameter
) const {
1651 // Expected number of parameters that we actually track is 1.
1653 // Also, the maximum number of declared parameters could not be on a scale
1654 // of hundreds of thousands.
1656 // In this setting, linear search seems reasonable and even performs better
1658 ParamSizedVector
<const ParmVarDecl
*>::const_iterator It
=
1659 llvm::find(TrackedParams
, &Parameter
);
1661 if (It
!= TrackedParams
.end()) {
1662 return It
- TrackedParams
.begin();
1665 return std::nullopt
;
1668 const ParmVarDecl
*getParameter(unsigned Index
) const {
1669 assert(Index
< TrackedParams
.size());
1670 return TrackedParams
[Index
];
1673 const CFG
&FunctionCFG
;
1674 AnalysisDeclContext
&AC
;
1675 CalledOnceCheckHandler
&Handler
;
1676 bool CheckConventionalParameters
;
1677 // As of now, we turn this behavior off. So, we still are going to report
1678 // missing calls on paths that look like it was intentional.
1679 // Technically such reports are true positives, but they can make some users
1680 // grumpy because of the sheer number of warnings.
1681 // It can be turned back on if we decide that we want to have the other way
1683 bool SuppressOnConventionalErrorPaths
= false;
1685 // The user can annotate variable declarations with cleanup functions, which
1686 // essentially imposes a custom destructor logic on that variable.
1687 // It is possible to use it, however, to call tracked parameters on all exits
1688 // from the function. For this reason, we track the fact that the function
1689 // actually has these.
1690 bool FunctionHasCleanupVars
= false;
1693 ParamSizedVector
<const ParmVarDecl
*> TrackedParams
;
1694 CFGSizedVector
<State
> States
;
1697 } // end anonymous namespace
1700 void checkCalledOnceParameters(AnalysisDeclContext
&AC
,
1701 CalledOnceCheckHandler
&Handler
,
1702 bool CheckConventionalParameters
) {
1703 CalledOnceChecker::check(AC
, Handler
, CheckConventionalParameters
);
1705 } // end namespace clang