//===- BugReporterVisitors.cpp - Helpers for reporting bugs ---------------===// // // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. // See https://llvm.org/LICENSE.txt for license information. // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception // //===----------------------------------------------------------------------===// // // This file defines a set of BugReporter "visitors" which can be used to // enhance the diagnostics reported for a bug. // //===----------------------------------------------------------------------===// #include "clang/StaticAnalyzer/Core/BugReporter/BugReporterVisitors.h" #include "clang/AST/ASTContext.h" #include "clang/AST/Decl.h" #include "clang/AST/DeclBase.h" #include "clang/AST/DeclCXX.h" #include "clang/AST/Expr.h" #include "clang/AST/ExprCXX.h" #include "clang/AST/ExprObjC.h" #include "clang/AST/Stmt.h" #include "clang/AST/Type.h" #include "clang/ASTMatchers/ASTMatchFinder.h" #include "clang/Analysis/AnalysisDeclContext.h" #include "clang/Analysis/CFG.h" #include "clang/Analysis/CFGStmtMap.h" #include "clang/Analysis/ProgramPoint.h" #include "clang/Basic/IdentifierTable.h" #include "clang/Basic/LLVM.h" #include "clang/Basic/SourceLocation.h" #include "clang/Basic/SourceManager.h" #include "clang/Lex/Lexer.h" #include "clang/StaticAnalyzer/Core/AnalyzerOptions.h" #include "clang/StaticAnalyzer/Core/BugReporter/BugReporter.h" #include "clang/StaticAnalyzer/Core/BugReporter/PathDiagnostic.h" #include "clang/StaticAnalyzer/Core/PathSensitive/AnalysisManager.h" #include "clang/StaticAnalyzer/Core/PathSensitive/CallEvent.h" #include "clang/StaticAnalyzer/Core/PathSensitive/ExplodedGraph.h" #include "clang/StaticAnalyzer/Core/PathSensitive/ExprEngine.h" #include "clang/StaticAnalyzer/Core/PathSensitive/MemRegion.h" #include "clang/StaticAnalyzer/Core/PathSensitive/ProgramState.h" #include "clang/StaticAnalyzer/Core/PathSensitive/ProgramState_Fwd.h" #include "clang/StaticAnalyzer/Core/PathSensitive/SMTConv.h" #include "clang/StaticAnalyzer/Core/PathSensitive/SValBuilder.h" #include "clang/StaticAnalyzer/Core/PathSensitive/SVals.h" #include "clang/StaticAnalyzer/Core/PathSensitive/SubEngine.h" #include "llvm/ADT/ArrayRef.h" #include "llvm/ADT/None.h" #include "llvm/ADT/Optional.h" #include "llvm/ADT/STLExtras.h" #include "llvm/ADT/SmallPtrSet.h" #include "llvm/ADT/SmallString.h" #include "llvm/ADT/SmallVector.h" #include "llvm/ADT/StringExtras.h" #include "llvm/ADT/StringRef.h" #include "llvm/Support/Casting.h" #include "llvm/Support/ErrorHandling.h" #include "llvm/Support/raw_ostream.h" #include #include #include #include #include using namespace clang; using namespace ento; //===----------------------------------------------------------------------===// // Utility functions. //===----------------------------------------------------------------------===// static const Expr *peelOffPointerArithmetic(const BinaryOperator *B) { if (B->isAdditiveOp() && B->getType()->isPointerType()) { if (B->getLHS()->getType()->isPointerType()) { return B->getLHS(); } else if (B->getRHS()->getType()->isPointerType()) { return B->getRHS(); } } return nullptr; } /// Given that expression S represents a pointer that would be dereferenced, /// try to find a sub-expression from which the pointer came from. /// This is used for tracking down origins of a null or undefined value: /// "this is null because that is null because that is null" etc. /// We wipe away field and element offsets because they merely add offsets. /// We also wipe away all casts except lvalue-to-rvalue casts, because the /// latter represent an actual pointer dereference; however, we remove /// the final lvalue-to-rvalue cast before returning from this function /// because it demonstrates more clearly from where the pointer rvalue was /// loaded. Examples: /// x->y.z ==> x (lvalue) /// foo()->y.z ==> foo() (rvalue) const Expr *bugreporter::getDerefExpr(const Stmt *S) { const auto *E = dyn_cast(S); if (!E) return nullptr; while (true) { if (const auto *CE = dyn_cast(E)) { if (CE->getCastKind() == CK_LValueToRValue) { // This cast represents the load we're looking for. break; } E = CE->getSubExpr(); } else if (const auto *B = dyn_cast(E)) { // Pointer arithmetic: '*(x + 2)' -> 'x') etc. if (const Expr *Inner = peelOffPointerArithmetic(B)) { E = Inner; } else { // Probably more arithmetic can be pattern-matched here, // but for now give up. break; } } else if (const auto *U = dyn_cast(E)) { if (U->getOpcode() == UO_Deref || U->getOpcode() == UO_AddrOf || (U->isIncrementDecrementOp() && U->getType()->isPointerType())) { // Operators '*' and '&' don't actually mean anything. // We look at casts instead. E = U->getSubExpr(); } else { // Probably more arithmetic can be pattern-matched here, // but for now give up. break; } } // Pattern match for a few useful cases: a[0], p->f, *p etc. else if (const auto *ME = dyn_cast(E)) { E = ME->getBase(); } else if (const auto *IvarRef = dyn_cast(E)) { E = IvarRef->getBase(); } else if (const auto *AE = dyn_cast(E)) { E = AE->getBase(); } else if (const auto *PE = dyn_cast(E)) { E = PE->getSubExpr(); } else if (const auto *FE = dyn_cast(E)) { E = FE->getSubExpr(); } else { // Other arbitrary stuff. break; } } // Special case: remove the final lvalue-to-rvalue cast, but do not recurse // deeper into the sub-expression. This way we return the lvalue from which // our pointer rvalue was loaded. if (const auto *CE = dyn_cast(E)) if (CE->getCastKind() == CK_LValueToRValue) E = CE->getSubExpr(); return E; } //===----------------------------------------------------------------------===// // Definitions for bug reporter visitors. //===----------------------------------------------------------------------===// std::shared_ptr BugReporterVisitor::getEndPath(BugReporterContext &, const ExplodedNode *, BugReport &) { return nullptr; } void BugReporterVisitor::finalizeVisitor(BugReporterContext &, const ExplodedNode *, BugReport &) {} std::shared_ptr BugReporterVisitor::getDefaultEndPath( BugReporterContext &BRC, const ExplodedNode *EndPathNode, BugReport &BR) { PathDiagnosticLocation L = PathDiagnosticLocation::createEndOfPath(EndPathNode,BRC.getSourceManager()); const auto &Ranges = BR.getRanges(); // Only add the statement itself as a range if we didn't specify any // special ranges for this report. auto P = std::make_shared( L, BR.getDescription(), Ranges.begin() == Ranges.end()); for (SourceRange Range : Ranges) P->addRange(Range); return P; } /// \return name of the macro inside the location \p Loc. static StringRef getMacroName(SourceLocation Loc, BugReporterContext &BRC) { return Lexer::getImmediateMacroName( Loc, BRC.getSourceManager(), BRC.getASTContext().getLangOpts()); } /// \return Whether given spelling location corresponds to an expansion /// of a function-like macro. static bool isFunctionMacroExpansion(SourceLocation Loc, const SourceManager &SM) { if (!Loc.isMacroID()) return false; while (SM.isMacroArgExpansion(Loc)) Loc = SM.getImmediateExpansionRange(Loc).getBegin(); std::pair TLInfo = SM.getDecomposedLoc(Loc); SrcMgr::SLocEntry SE = SM.getSLocEntry(TLInfo.first); const SrcMgr::ExpansionInfo &EInfo = SE.getExpansion(); return EInfo.isFunctionMacroExpansion(); } /// \return Whether \c RegionOfInterest was modified at \p N, /// where \p ReturnState is a state associated with the return /// from the current frame. static bool wasRegionOfInterestModifiedAt( const SubRegion *RegionOfInterest, const ExplodedNode *N, SVal ValueAfter) { ProgramStateRef State = N->getState(); ProgramStateManager &Mgr = N->getState()->getStateManager(); if (!N->getLocationAs() && !N->getLocationAs() && !N->getLocationAs()) return false; // Writing into region of interest. if (auto PS = N->getLocationAs()) if (auto *BO = PS->getStmtAs()) if (BO->isAssignmentOp() && RegionOfInterest->isSubRegionOf( N->getSVal(BO->getLHS()).getAsRegion())) return true; // SVal after the state is possibly different. SVal ValueAtN = N->getState()->getSVal(RegionOfInterest); if (!Mgr.getSValBuilder().areEqual(State, ValueAtN, ValueAfter).isConstrainedTrue() && (!ValueAtN.isUndef() || !ValueAfter.isUndef())) return true; return false; } namespace { /// Put a diagnostic on return statement of all inlined functions /// for which the region of interest \p RegionOfInterest was passed into, /// but not written inside, and it has caused an undefined read or a null /// pointer dereference outside. class NoStoreFuncVisitor final : public BugReporterVisitor { const SubRegion *RegionOfInterest; MemRegionManager &MmrMgr; const SourceManager &SM; const PrintingPolicy &PP; /// Recursion limit for dereferencing fields when looking for the /// region of interest. /// The limit of two indicates that we will dereference fields only once. static const unsigned DEREFERENCE_LIMIT = 2; /// Frames writing into \c RegionOfInterest. /// This visitor generates a note only if a function does not write into /// a region of interest. This information is not immediately available /// by looking at the node associated with the exit from the function /// (usually the return statement). To avoid recomputing the same information /// many times (going up the path for each node and checking whether the /// region was written into) we instead lazily compute the /// stack frames along the path which write into the region of interest. llvm::SmallPtrSet FramesModifyingRegion; llvm::SmallPtrSet FramesModifyingCalculated; using RegionVector = SmallVector; public: NoStoreFuncVisitor(const SubRegion *R) : RegionOfInterest(R), MmrMgr(*R->getMemRegionManager()), SM(MmrMgr.getContext().getSourceManager()), PP(MmrMgr.getContext().getPrintingPolicy()) {} void Profile(llvm::FoldingSetNodeID &ID) const override { static int Tag = 0; ID.AddPointer(&Tag); ID.AddPointer(RegionOfInterest); } std::shared_ptr VisitNode(const ExplodedNode *N, BugReporterContext &BR, BugReport &) override { const LocationContext *Ctx = N->getLocationContext(); const StackFrameContext *SCtx = Ctx->getStackFrame(); ProgramStateRef State = N->getState(); auto CallExitLoc = N->getLocationAs(); // No diagnostic if region was modified inside the frame. if (!CallExitLoc || isRegionOfInterestModifiedInFrame(N)) return nullptr; CallEventRef<> Call = BR.getStateManager().getCallEventManager().getCaller(SCtx, State); if (SM.isInSystemHeader(Call->getDecl()->getSourceRange().getBegin())) return nullptr; // Region of interest corresponds to an IVar, exiting a method // which could have written into that IVar, but did not. if (const auto *MC = dyn_cast(Call)) { if (const auto *IvarR = dyn_cast(RegionOfInterest)) { const MemRegion *SelfRegion = MC->getReceiverSVal().getAsRegion(); if (RegionOfInterest->isSubRegionOf(SelfRegion) && potentiallyWritesIntoIvar(Call->getRuntimeDefinition().getDecl(), IvarR->getDecl())) return notModifiedDiagnostics(N, {}, SelfRegion, "self", /*FirstIsReferenceType=*/false, 1); } } if (const auto *CCall = dyn_cast(Call)) { const MemRegion *ThisR = CCall->getCXXThisVal().getAsRegion(); if (RegionOfInterest->isSubRegionOf(ThisR) && !CCall->getDecl()->isImplicit()) return notModifiedDiagnostics(N, {}, ThisR, "this", /*FirstIsReferenceType=*/false, 1); // Do not generate diagnostics for not modified parameters in // constructors. return nullptr; } ArrayRef parameters = getCallParameters(Call); for (unsigned I = 0; I < Call->getNumArgs() && I < parameters.size(); ++I) { const ParmVarDecl *PVD = parameters[I]; SVal S = Call->getArgSVal(I); bool ParamIsReferenceType = PVD->getType()->isReferenceType(); std::string ParamName = PVD->getNameAsString(); int IndirectionLevel = 1; QualType T = PVD->getType(); while (const MemRegion *R = S.getAsRegion()) { if (RegionOfInterest->isSubRegionOf(R) && !isPointerToConst(T)) return notModifiedDiagnostics(N, {}, R, ParamName, ParamIsReferenceType, IndirectionLevel); QualType PT = T->getPointeeType(); if (PT.isNull() || PT->isVoidType()) break; if (const RecordDecl *RD = PT->getAsRecordDecl()) if (auto P = findRegionOfInterestInRecord(RD, State, R)) return notModifiedDiagnostics(N, *P, RegionOfInterest, ParamName, ParamIsReferenceType, IndirectionLevel); S = State->getSVal(R, PT); T = PT; IndirectionLevel++; } } return nullptr; } private: /// Attempts to find the region of interest in a given CXX decl, /// by either following the base classes or fields. /// Dereferences fields up to a given recursion limit. /// Note that \p Vec is passed by value, leading to quadratic copying cost, /// but it's OK in practice since its length is limited to DEREFERENCE_LIMIT. /// \return A chain fields leading to the region of interest or None. const Optional findRegionOfInterestInRecord(const RecordDecl *RD, ProgramStateRef State, const MemRegion *R, const RegionVector &Vec = {}, int depth = 0) { if (depth == DEREFERENCE_LIMIT) // Limit the recursion depth. return None; if (const auto *RDX = dyn_cast(RD)) if (!RDX->hasDefinition()) return None; // Recursively examine the base classes. // Note that following base classes does not increase the recursion depth. if (const auto *RDX = dyn_cast(RD)) for (const auto II : RDX->bases()) if (const RecordDecl *RRD = II.getType()->getAsRecordDecl()) if (auto Out = findRegionOfInterestInRecord(RRD, State, R, Vec, depth)) return Out; for (const FieldDecl *I : RD->fields()) { QualType FT = I->getType(); const FieldRegion *FR = MmrMgr.getFieldRegion(I, cast(R)); const SVal V = State->getSVal(FR); const MemRegion *VR = V.getAsRegion(); RegionVector VecF = Vec; VecF.push_back(FR); if (RegionOfInterest == VR) return VecF; if (const RecordDecl *RRD = FT->getAsRecordDecl()) if (auto Out = findRegionOfInterestInRecord(RRD, State, FR, VecF, depth + 1)) return Out; QualType PT = FT->getPointeeType(); if (PT.isNull() || PT->isVoidType() || !VR) continue; if (const RecordDecl *RRD = PT->getAsRecordDecl()) if (auto Out = findRegionOfInterestInRecord(RRD, State, VR, VecF, depth + 1)) return Out; } return None; } /// \return Whether the method declaration \p Parent /// syntactically has a binary operation writing into the ivar \p Ivar. bool potentiallyWritesIntoIvar(const Decl *Parent, const ObjCIvarDecl *Ivar) { using namespace ast_matchers; const char * IvarBind = "Ivar"; if (!Parent || !Parent->hasBody()) return false; StatementMatcher WriteIntoIvarM = binaryOperator( hasOperatorName("="), hasLHS(ignoringParenImpCasts( objcIvarRefExpr(hasDeclaration(equalsNode(Ivar))).bind(IvarBind)))); StatementMatcher ParentM = stmt(hasDescendant(WriteIntoIvarM)); auto Matches = match(ParentM, *Parent->getBody(), Parent->getASTContext()); for (BoundNodes &Match : Matches) { auto IvarRef = Match.getNodeAs(IvarBind); if (IvarRef->isFreeIvar()) return true; const Expr *Base = IvarRef->getBase(); if (const auto *ICE = dyn_cast(Base)) Base = ICE->getSubExpr(); if (const auto *DRE = dyn_cast(Base)) if (const auto *ID = dyn_cast(DRE->getDecl())) if (ID->getParameterKind() == ImplicitParamDecl::ObjCSelf) return true; return false; } return false; } /// Check and lazily calculate whether the region of interest is /// modified in the stack frame to which \p N belongs. /// The calculation is cached in FramesModifyingRegion. bool isRegionOfInterestModifiedInFrame(const ExplodedNode *N) { const LocationContext *Ctx = N->getLocationContext(); const StackFrameContext *SCtx = Ctx->getStackFrame(); if (!FramesModifyingCalculated.count(SCtx)) findModifyingFrames(N); return FramesModifyingRegion.count(SCtx); } /// Write to \c FramesModifyingRegion all stack frames along /// the path in the current stack frame which modify \c RegionOfInterest. void findModifyingFrames(const ExplodedNode *N) { assert(N->getLocationAs()); ProgramStateRef LastReturnState = N->getState(); SVal ValueAtReturn = LastReturnState->getSVal(RegionOfInterest); const LocationContext *Ctx = N->getLocationContext(); const StackFrameContext *OriginalSCtx = Ctx->getStackFrame(); do { ProgramStateRef State = N->getState(); auto CallExitLoc = N->getLocationAs(); if (CallExitLoc) { LastReturnState = State; ValueAtReturn = LastReturnState->getSVal(RegionOfInterest); } FramesModifyingCalculated.insert( N->getLocationContext()->getStackFrame()); if (wasRegionOfInterestModifiedAt(RegionOfInterest, N, ValueAtReturn)) { const StackFrameContext *SCtx = N->getStackFrame(); while (!SCtx->inTopFrame()) { auto p = FramesModifyingRegion.insert(SCtx); if (!p.second) break; // Frame and all its parents already inserted. SCtx = SCtx->getParent()->getStackFrame(); } } // Stop calculation at the call to the current function. if (auto CE = N->getLocationAs()) if (CE->getCalleeContext() == OriginalSCtx) break; N = N->getFirstPred(); } while (N); } /// Get parameters associated with runtime definition in order /// to get the correct parameter name. ArrayRef getCallParameters(CallEventRef<> Call) { // Use runtime definition, if available. RuntimeDefinition RD = Call->getRuntimeDefinition(); if (const auto *FD = dyn_cast_or_null(RD.getDecl())) return FD->parameters(); if (const auto *MD = dyn_cast_or_null(RD.getDecl())) return MD->parameters(); return Call->parameters(); } /// \return whether \p Ty points to a const type, or is a const reference. bool isPointerToConst(QualType Ty) { return !Ty->getPointeeType().isNull() && Ty->getPointeeType().getCanonicalType().isConstQualified(); } /// \return Diagnostics piece for region not modified in the current function. std::shared_ptr notModifiedDiagnostics(const ExplodedNode *N, const RegionVector &FieldChain, const MemRegion *MatchedRegion, StringRef FirstElement, bool FirstIsReferenceType, unsigned IndirectionLevel) { PathDiagnosticLocation L = PathDiagnosticLocation::create(N->getLocation(), SM); SmallString<256> sbuf; llvm::raw_svector_ostream os(sbuf); os << "Returning without writing to '"; // Do not generate the note if failed to pretty-print. if (!prettyPrintRegionName(FirstElement, FirstIsReferenceType, MatchedRegion, FieldChain, IndirectionLevel, os)) return nullptr; os << "'"; return std::make_shared(L, os.str()); } /// Pretty-print region \p MatchedRegion to \p os. /// \return Whether printing succeeded. bool prettyPrintRegionName(StringRef FirstElement, bool FirstIsReferenceType, const MemRegion *MatchedRegion, const RegionVector &FieldChain, int IndirectionLevel, llvm::raw_svector_ostream &os) { if (FirstIsReferenceType) IndirectionLevel--; RegionVector RegionSequence; // Add the regions in the reverse order, then reverse the resulting array. assert(RegionOfInterest->isSubRegionOf(MatchedRegion)); const MemRegion *R = RegionOfInterest; while (R != MatchedRegion) { RegionSequence.push_back(R); R = cast(R)->getSuperRegion(); } std::reverse(RegionSequence.begin(), RegionSequence.end()); RegionSequence.append(FieldChain.begin(), FieldChain.end()); StringRef Sep; for (const MemRegion *R : RegionSequence) { // Just keep going up to the base region. // Element regions may appear due to casts. if (isa(R) || isa(R)) continue; if (Sep.empty()) Sep = prettyPrintFirstElement(FirstElement, /*MoreItemsExpected=*/true, IndirectionLevel, os); os << Sep; // Can only reasonably pretty-print DeclRegions. if (!isa(R)) return false; const auto *DR = cast(R); Sep = DR->getValueType()->isAnyPointerType() ? "->" : "."; DR->getDecl()->getDeclName().print(os, PP); } if (Sep.empty()) prettyPrintFirstElement(FirstElement, /*MoreItemsExpected=*/false, IndirectionLevel, os); return true; } /// Print first item in the chain, return new separator. StringRef prettyPrintFirstElement(StringRef FirstElement, bool MoreItemsExpected, int IndirectionLevel, llvm::raw_svector_ostream &os) { StringRef Out = "."; if (IndirectionLevel > 0 && MoreItemsExpected) { IndirectionLevel--; Out = "->"; } if (IndirectionLevel > 0 && MoreItemsExpected) os << "("; for (int i=0; i 0 && MoreItemsExpected) os << ")"; return Out; } }; /// Suppress null-pointer-dereference bugs where dereferenced null was returned /// the macro. class MacroNullReturnSuppressionVisitor final : public BugReporterVisitor { const SubRegion *RegionOfInterest; const SVal ValueAtDereference; // Do not invalidate the reports where the value was modified // after it got assigned to from the macro. bool WasModified = false; public: MacroNullReturnSuppressionVisitor(const SubRegion *R, const SVal V) : RegionOfInterest(R), ValueAtDereference(V) {} std::shared_ptr VisitNode(const ExplodedNode *N, BugReporterContext &BRC, BugReport &BR) override { if (WasModified) return nullptr; auto BugPoint = BR.getErrorNode()->getLocation().getAs(); if (!BugPoint) return nullptr; const SourceManager &SMgr = BRC.getSourceManager(); if (auto Loc = matchAssignment(N)) { if (isFunctionMacroExpansion(*Loc, SMgr)) { std::string MacroName = getMacroName(*Loc, BRC); SourceLocation BugLoc = BugPoint->getStmt()->getBeginLoc(); if (!BugLoc.isMacroID() || getMacroName(BugLoc, BRC) != MacroName) BR.markInvalid(getTag(), MacroName.c_str()); } } if (wasRegionOfInterestModifiedAt(RegionOfInterest, N, ValueAtDereference)) WasModified = true; return nullptr; } static void addMacroVisitorIfNecessary( const ExplodedNode *N, const MemRegion *R, bool EnableNullFPSuppression, BugReport &BR, const SVal V) { AnalyzerOptions &Options = N->getState()->getAnalysisManager().options; if (EnableNullFPSuppression && Options.ShouldSuppressNullReturnPaths && V.getAs()) BR.addVisitor(llvm::make_unique( R->getAs(), V)); } void* getTag() const { static int Tag = 0; return static_cast(&Tag); } void Profile(llvm::FoldingSetNodeID &ID) const override { ID.AddPointer(getTag()); } private: /// \return Source location of right hand side of an assignment /// into \c RegionOfInterest, empty optional if none found. Optional matchAssignment(const ExplodedNode *N) { const Stmt *S = PathDiagnosticLocation::getStmt(N); ProgramStateRef State = N->getState(); auto *LCtx = N->getLocationContext(); if (!S) return None; if (const auto *DS = dyn_cast(S)) { if (const auto *VD = dyn_cast(DS->getSingleDecl())) if (const Expr *RHS = VD->getInit()) if (RegionOfInterest->isSubRegionOf( State->getLValue(VD, LCtx).getAsRegion())) return RHS->getBeginLoc(); } else if (const auto *BO = dyn_cast(S)) { const MemRegion *R = N->getSVal(BO->getLHS()).getAsRegion(); const Expr *RHS = BO->getRHS(); if (BO->isAssignmentOp() && RegionOfInterest->isSubRegionOf(R)) { return RHS->getBeginLoc(); } } return None; } }; /// Emits an extra note at the return statement of an interesting stack frame. /// /// The returned value is marked as an interesting value, and if it's null, /// adds a visitor to track where it became null. /// /// This visitor is intended to be used when another visitor discovers that an /// interesting value comes from an inlined function call. class ReturnVisitor : public BugReporterVisitor { const StackFrameContext *StackFrame; enum { Initial, MaybeUnsuppress, Satisfied } Mode = Initial; bool EnableNullFPSuppression; bool ShouldInvalidate = true; AnalyzerOptions& Options; public: ReturnVisitor(const StackFrameContext *Frame, bool Suppressed, AnalyzerOptions &Options) : StackFrame(Frame), EnableNullFPSuppression(Suppressed), Options(Options) {} static void *getTag() { static int Tag = 0; return static_cast(&Tag); } void Profile(llvm::FoldingSetNodeID &ID) const override { ID.AddPointer(ReturnVisitor::getTag()); ID.AddPointer(StackFrame); ID.AddBoolean(EnableNullFPSuppression); } /// Adds a ReturnVisitor if the given statement represents a call that was /// inlined. /// /// This will search back through the ExplodedGraph, starting from the given /// node, looking for when the given statement was processed. If it turns out /// the statement is a call that was inlined, we add the visitor to the /// bug report, so it can print a note later. static void addVisitorIfNecessary(const ExplodedNode *Node, const Stmt *S, BugReport &BR, bool InEnableNullFPSuppression) { if (!CallEvent::isCallStmt(S)) return; // First, find when we processed the statement. do { if (auto CEE = Node->getLocationAs()) if (CEE->getCalleeContext()->getCallSite() == S) break; if (auto SP = Node->getLocationAs()) if (SP->getStmt() == S) break; Node = Node->getFirstPred(); } while (Node); // Next, step over any post-statement checks. while (Node && Node->getLocation().getAs()) Node = Node->getFirstPred(); if (!Node) return; // Finally, see if we inlined the call. Optional CEE = Node->getLocationAs(); if (!CEE) return; const StackFrameContext *CalleeContext = CEE->getCalleeContext(); if (CalleeContext->getCallSite() != S) return; // Check the return value. ProgramStateRef State = Node->getState(); SVal RetVal = Node->getSVal(S); // Handle cases where a reference is returned and then immediately used. if (cast(S)->isGLValue()) if (Optional LValue = RetVal.getAs()) RetVal = State->getSVal(*LValue); // See if the return value is NULL. If so, suppress the report. AnalyzerOptions &Options = State->getAnalysisManager().options; bool EnableNullFPSuppression = false; if (InEnableNullFPSuppression && Options.ShouldSuppressNullReturnPaths) if (Optional RetLoc = RetVal.getAs()) EnableNullFPSuppression = State->isNull(*RetLoc).isConstrainedTrue(); BR.markInteresting(CalleeContext); BR.addVisitor(llvm::make_unique(CalleeContext, EnableNullFPSuppression, Options)); } std::shared_ptr visitNodeInitial(const ExplodedNode *N, BugReporterContext &BRC, BugReport &BR) { // Only print a message at the interesting return statement. if (N->getLocationContext() != StackFrame) return nullptr; Optional SP = N->getLocationAs(); if (!SP) return nullptr; const auto *Ret = dyn_cast(SP->getStmt()); if (!Ret) return nullptr; // Okay, we're at the right return statement, but do we have the return // value available? ProgramStateRef State = N->getState(); SVal V = State->getSVal(Ret, StackFrame); if (V.isUnknownOrUndef()) return nullptr; // Don't print any more notes after this one. Mode = Satisfied; const Expr *RetE = Ret->getRetValue(); assert(RetE && "Tracking a return value for a void function"); // Handle cases where a reference is returned and then immediately used. Optional LValue; if (RetE->isGLValue()) { if ((LValue = V.getAs())) { SVal RValue = State->getRawSVal(*LValue, RetE->getType()); if (RValue.getAs()) V = RValue; } } // Ignore aggregate rvalues. if (V.getAs() || V.getAs()) return nullptr; RetE = RetE->IgnoreParenCasts(); // If we're returning 0, we should track where that 0 came from. bugreporter::trackExpressionValue(N, RetE, BR, EnableNullFPSuppression); // Build an appropriate message based on the return value. SmallString<64> Msg; llvm::raw_svector_ostream Out(Msg); if (State->isNull(V).isConstrainedTrue()) { if (V.getAs()) { // If we have counter-suppression enabled, make sure we keep visiting // future nodes. We want to emit a path note as well, in case // the report is resurrected as valid later on. if (EnableNullFPSuppression && Options.ShouldAvoidSuppressingNullArgumentPaths) Mode = MaybeUnsuppress; if (RetE->getType()->isObjCObjectPointerType()) { Out << "Returning nil"; } else { Out << "Returning null pointer"; } } else { Out << "Returning zero"; } } else { if (auto CI = V.getAs()) { Out << "Returning the value " << CI->getValue(); } else if (V.getAs()) { Out << "Returning pointer"; } else { Out << "Returning value"; } } if (LValue) { if (const MemRegion *MR = LValue->getAsRegion()) { if (MR->canPrintPretty()) { Out << " (reference to "; MR->printPretty(Out); Out << ")"; } } } else { // FIXME: We should have a more generalized location printing mechanism. if (const auto *DR = dyn_cast(RetE)) if (const auto *DD = dyn_cast(DR->getDecl())) Out << " (loaded from '" << *DD << "')"; } PathDiagnosticLocation L(Ret, BRC.getSourceManager(), StackFrame); if (!L.isValid() || !L.asLocation().isValid()) return nullptr; return std::make_shared(L, Out.str()); } std::shared_ptr visitNodeMaybeUnsuppress(const ExplodedNode *N, BugReporterContext &BRC, BugReport &BR) { #ifndef NDEBUG assert(Options.ShouldAvoidSuppressingNullArgumentPaths); #endif // Are we at the entry node for this call? Optional CE = N->getLocationAs(); if (!CE) return nullptr; if (CE->getCalleeContext() != StackFrame) return nullptr; Mode = Satisfied; // Don't automatically suppress a report if one of the arguments is // known to be a null pointer. Instead, start tracking /that/ null // value back to its origin. ProgramStateManager &StateMgr = BRC.getStateManager(); CallEventManager &CallMgr = StateMgr.getCallEventManager(); ProgramStateRef State = N->getState(); CallEventRef<> Call = CallMgr.getCaller(StackFrame, State); for (unsigned I = 0, E = Call->getNumArgs(); I != E; ++I) { Optional ArgV = Call->getArgSVal(I).getAs(); if (!ArgV) continue; const Expr *ArgE = Call->getArgExpr(I); if (!ArgE) continue; // Is it possible for this argument to be non-null? if (!State->isNull(*ArgV).isConstrainedTrue()) continue; if (bugreporter::trackExpressionValue(N, ArgE, BR, EnableNullFPSuppression)) ShouldInvalidate = false; // If we /can't/ track the null pointer, we should err on the side of // false negatives, and continue towards marking this report invalid. // (We will still look at the other arguments, though.) } return nullptr; } std::shared_ptr VisitNode(const ExplodedNode *N, BugReporterContext &BRC, BugReport &BR) override { switch (Mode) { case Initial: return visitNodeInitial(N, BRC, BR); case MaybeUnsuppress: return visitNodeMaybeUnsuppress(N, BRC, BR); case Satisfied: return nullptr; } llvm_unreachable("Invalid visit mode!"); } void finalizeVisitor(BugReporterContext &, const ExplodedNode *, BugReport &BR) override { if (EnableNullFPSuppression && ShouldInvalidate) BR.markInvalid(ReturnVisitor::getTag(), StackFrame); } }; } // namespace void FindLastStoreBRVisitor::Profile(llvm::FoldingSetNodeID &ID) const { static int tag = 0; ID.AddPointer(&tag); ID.AddPointer(R); ID.Add(V); ID.AddBoolean(EnableNullFPSuppression); } /// Returns true if \p N represents the DeclStmt declaring and initializing /// \p VR. static bool isInitializationOfVar(const ExplodedNode *N, const VarRegion *VR) { Optional P = N->getLocationAs(); if (!P) return false; const DeclStmt *DS = P->getStmtAs(); if (!DS) return false; if (DS->getSingleDecl() != VR->getDecl()) return false; const MemSpaceRegion *VarSpace = VR->getMemorySpace(); const auto *FrameSpace = dyn_cast(VarSpace); if (!FrameSpace) { // If we ever directly evaluate global DeclStmts, this assertion will be // invalid, but this still seems preferable to silently accepting an // initialization that may be for a path-sensitive variable. assert(VR->getDecl()->isStaticLocal() && "non-static stackless VarRegion"); return true; } assert(VR->getDecl()->hasLocalStorage()); const LocationContext *LCtx = N->getLocationContext(); return FrameSpace->getStackFrame() == LCtx->getStackFrame(); } /// Show diagnostics for initializing or declaring a region \p R with a bad value. static void showBRDiagnostics(const char *action, llvm::raw_svector_ostream &os, const MemRegion *R, SVal V, const DeclStmt *DS) { if (R->canPrintPretty()) { R->printPretty(os); os << " "; } if (V.getAs()) { bool b = false; if (R->isBoundable()) { if (const auto *TR = dyn_cast(R)) { if (TR->getValueType()->isObjCObjectPointerType()) { os << action << "nil"; b = true; } } } if (!b) os << action << "a null pointer value"; } else if (auto CVal = V.getAs()) { os << action << CVal->getValue(); } else if (DS) { if (V.isUndef()) { if (isa(R)) { const auto *VD = cast(DS->getSingleDecl()); if (VD->getInit()) { os << (R->canPrintPretty() ? "initialized" : "Initializing") << " to a garbage value"; } else { os << (R->canPrintPretty() ? "declared" : "Declaring") << " without an initial value"; } } } else { os << (R->canPrintPretty() ? "initialized" : "Initialized") << " here"; } } } /// Display diagnostics for passing bad region as a parameter. static void showBRParamDiagnostics(llvm::raw_svector_ostream& os, const VarRegion *VR, SVal V) { const auto *Param = cast(VR->getDecl()); os << "Passing "; if (V.getAs()) { if (Param->getType()->isObjCObjectPointerType()) os << "nil object reference"; else os << "null pointer value"; } else if (V.isUndef()) { os << "uninitialized value"; } else if (auto CI = V.getAs()) { os << "the value " << CI->getValue(); } else { os << "value"; } // Printed parameter indexes are 1-based, not 0-based. unsigned Idx = Param->getFunctionScopeIndex() + 1; os << " via " << Idx << llvm::getOrdinalSuffix(Idx) << " parameter"; if (VR->canPrintPretty()) { os << " "; VR->printPretty(os); } } /// Show default diagnostics for storing bad region. static void showBRDefaultDiagnostics(llvm::raw_svector_ostream& os, const MemRegion *R, SVal V) { if (V.getAs()) { bool b = false; if (R->isBoundable()) { if (const auto *TR = dyn_cast(R)) { if (TR->getValueType()->isObjCObjectPointerType()) { os << "nil object reference stored"; b = true; } } } if (!b) { if (R->canPrintPretty()) os << "Null pointer value stored"; else os << "Storing null pointer value"; } } else if (V.isUndef()) { if (R->canPrintPretty()) os << "Uninitialized value stored"; else os << "Storing uninitialized value"; } else if (auto CV = V.getAs()) { if (R->canPrintPretty()) os << "The value " << CV->getValue() << " is assigned"; else os << "Assigning " << CV->getValue(); } else { if (R->canPrintPretty()) os << "Value assigned"; else os << "Assigning value"; } if (R->canPrintPretty()) { os << " to "; R->printPretty(os); } } std::shared_ptr FindLastStoreBRVisitor::VisitNode(const ExplodedNode *Succ, BugReporterContext &BRC, BugReport &BR) { if (Satisfied) return nullptr; const ExplodedNode *StoreSite = nullptr; const ExplodedNode *Pred = Succ->getFirstPred(); const Expr *InitE = nullptr; bool IsParam = false; // First see if we reached the declaration of the region. if (const auto *VR = dyn_cast(R)) { if (isInitializationOfVar(Pred, VR)) { StoreSite = Pred; InitE = VR->getDecl()->getInit(); } } // If this is a post initializer expression, initializing the region, we // should track the initializer expression. if (Optional PIP = Pred->getLocationAs()) { const MemRegion *FieldReg = (const MemRegion *)PIP->getLocationValue(); if (FieldReg && FieldReg == R) { StoreSite = Pred; InitE = PIP->getInitializer()->getInit(); } } // Otherwise, see if this is the store site: // (1) Succ has this binding and Pred does not, i.e. this is // where the binding first occurred. // (2) Succ has this binding and is a PostStore node for this region, i.e. // the same binding was re-assigned here. if (!StoreSite) { if (Succ->getState()->getSVal(R) != V) return nullptr; if (Pred->getState()->getSVal(R) == V) { Optional PS = Succ->getLocationAs(); if (!PS || PS->getLocationValue() != R) return nullptr; } StoreSite = Succ; // If this is an assignment expression, we can track the value // being assigned. if (Optional P = Succ->getLocationAs()) if (const BinaryOperator *BO = P->getStmtAs()) if (BO->isAssignmentOp()) InitE = BO->getRHS(); // If this is a call entry, the variable should be a parameter. // FIXME: Handle CXXThisRegion as well. (This is not a priority because // 'this' should never be NULL, but this visitor isn't just for NULL and // UndefinedVal.) if (Optional CE = Succ->getLocationAs()) { if (const auto *VR = dyn_cast(R)) { const auto *Param = cast(VR->getDecl()); ProgramStateManager &StateMgr = BRC.getStateManager(); CallEventManager &CallMgr = StateMgr.getCallEventManager(); CallEventRef<> Call = CallMgr.getCaller(CE->getCalleeContext(), Succ->getState()); InitE = Call->getArgExpr(Param->getFunctionScopeIndex()); IsParam = true; } } // If this is a CXXTempObjectRegion, the Expr responsible for its creation // is wrapped inside of it. if (const auto *TmpR = dyn_cast(R)) InitE = TmpR->getExpr(); } if (!StoreSite) return nullptr; Satisfied = true; // If we have an expression that provided the value, try to track where it // came from. if (InitE) { if (V.isUndef() || V.getAs() || V.getAs()) { if (!IsParam) InitE = InitE->IgnoreParenCasts(); bugreporter::trackExpressionValue(StoreSite, InitE, BR, EnableNullFPSuppression); } ReturnVisitor::addVisitorIfNecessary(StoreSite, InitE->IgnoreParenCasts(), BR, EnableNullFPSuppression); } // Okay, we've found the binding. Emit an appropriate message. SmallString<256> sbuf; llvm::raw_svector_ostream os(sbuf); if (Optional PS = StoreSite->getLocationAs()) { const Stmt *S = PS->getStmt(); const char *action = nullptr; const auto *DS = dyn_cast(S); const auto *VR = dyn_cast(R); if (DS) { action = R->canPrintPretty() ? "initialized to " : "Initializing to "; } else if (isa(S)) { action = R->canPrintPretty() ? "captured by block as " : "Captured by block as "; if (VR) { // See if we can get the BlockVarRegion. ProgramStateRef State = StoreSite->getState(); SVal V = StoreSite->getSVal(S); if (const auto *BDR = dyn_cast_or_null(V.getAsRegion())) { if (const VarRegion *OriginalR = BDR->getOriginalRegion(VR)) { if (auto KV = State->getSVal(OriginalR).getAs()) BR.addVisitor(llvm::make_unique( *KV, OriginalR, EnableNullFPSuppression)); } } } } if (action) showBRDiagnostics(action, os, R, V, DS); } else if (StoreSite->getLocation().getAs()) { if (const auto *VR = dyn_cast(R)) showBRParamDiagnostics(os, VR, V); } if (os.str().empty()) showBRDefaultDiagnostics(os, R, V); // Construct a new PathDiagnosticPiece. ProgramPoint P = StoreSite->getLocation(); PathDiagnosticLocation L; if (P.getAs() && InitE) L = PathDiagnosticLocation(InitE, BRC.getSourceManager(), P.getLocationContext()); if (!L.isValid() || !L.asLocation().isValid()) L = PathDiagnosticLocation::create(P, BRC.getSourceManager()); if (!L.isValid() || !L.asLocation().isValid()) return nullptr; return std::make_shared(L, os.str()); } void TrackConstraintBRVisitor::Profile(llvm::FoldingSetNodeID &ID) const { static int tag = 0; ID.AddPointer(&tag); ID.AddBoolean(Assumption); ID.Add(Constraint); } /// Return the tag associated with this visitor. This tag will be used /// to make all PathDiagnosticPieces created by this visitor. const char *TrackConstraintBRVisitor::getTag() { return "TrackConstraintBRVisitor"; } bool TrackConstraintBRVisitor::isUnderconstrained(const ExplodedNode *N) const { if (IsZeroCheck) return N->getState()->isNull(Constraint).isUnderconstrained(); return (bool)N->getState()->assume(Constraint, !Assumption); } std::shared_ptr TrackConstraintBRVisitor::VisitNode(const ExplodedNode *N, BugReporterContext &BRC, BugReport &) { const ExplodedNode *PrevN = N->getFirstPred(); if (IsSatisfied) return nullptr; // Start tracking after we see the first state in which the value is // constrained. if (!IsTrackingTurnedOn) if (!isUnderconstrained(N)) IsTrackingTurnedOn = true; if (!IsTrackingTurnedOn) return nullptr; // Check if in the previous state it was feasible for this constraint // to *not* be true. if (isUnderconstrained(PrevN)) { IsSatisfied = true; // As a sanity check, make sure that the negation of the constraint // was infeasible in the current state. If it is feasible, we somehow // missed the transition point. assert(!isUnderconstrained(N)); // We found the transition point for the constraint. We now need to // pretty-print the constraint. (work-in-progress) SmallString<64> sbuf; llvm::raw_svector_ostream os(sbuf); if (Constraint.getAs()) { os << "Assuming pointer value is "; os << (Assumption ? "non-null" : "null"); } if (os.str().empty()) return nullptr; // Construct a new PathDiagnosticPiece. ProgramPoint P = N->getLocation(); PathDiagnosticLocation L = PathDiagnosticLocation::create(P, BRC.getSourceManager()); if (!L.isValid()) return nullptr; auto X = std::make_shared(L, os.str()); X->setTag(getTag()); return std::move(X); } return nullptr; } SuppressInlineDefensiveChecksVisitor:: SuppressInlineDefensiveChecksVisitor(DefinedSVal Value, const ExplodedNode *N) : V(Value) { // Check if the visitor is disabled. AnalyzerOptions &Options = N->getState()->getAnalysisManager().options; if (!Options.ShouldSuppressInlinedDefensiveChecks) IsSatisfied = true; assert(N->getState()->isNull(V).isConstrainedTrue() && "The visitor only tracks the cases where V is constrained to 0"); } void SuppressInlineDefensiveChecksVisitor::Profile( llvm::FoldingSetNodeID &ID) const { static int id = 0; ID.AddPointer(&id); ID.Add(V); } const char *SuppressInlineDefensiveChecksVisitor::getTag() { return "IDCVisitor"; } std::shared_ptr SuppressInlineDefensiveChecksVisitor::VisitNode(const ExplodedNode *Succ, BugReporterContext &BRC, BugReport &BR) { const ExplodedNode *Pred = Succ->getFirstPred(); if (IsSatisfied) return nullptr; // Start tracking after we see the first state in which the value is null. if (!IsTrackingTurnedOn) if (Succ->getState()->isNull(V).isConstrainedTrue()) IsTrackingTurnedOn = true; if (!IsTrackingTurnedOn) return nullptr; // Check if in the previous state it was feasible for this value // to *not* be null. if (!Pred->getState()->isNull(V).isConstrainedTrue()) { IsSatisfied = true; assert(Succ->getState()->isNull(V).isConstrainedTrue()); // Check if this is inlined defensive checks. const LocationContext *CurLC =Succ->getLocationContext(); const LocationContext *ReportLC = BR.getErrorNode()->getLocationContext(); if (CurLC != ReportLC && !CurLC->isParentOf(ReportLC)) { BR.markInvalid("Suppress IDC", CurLC); return nullptr; } // Treat defensive checks in function-like macros as if they were an inlined // defensive check. If the bug location is not in a macro and the // terminator for the current location is in a macro then suppress the // warning. auto BugPoint = BR.getErrorNode()->getLocation().getAs(); if (!BugPoint) return nullptr; ProgramPoint CurPoint = Succ->getLocation(); const Stmt *CurTerminatorStmt = nullptr; if (auto BE = CurPoint.getAs()) { CurTerminatorStmt = BE->getSrc()->getTerminator().getStmt(); } else if (auto SP = CurPoint.getAs()) { const Stmt *CurStmt = SP->getStmt(); if (!CurStmt->getBeginLoc().isMacroID()) return nullptr; CFGStmtMap *Map = CurLC->getAnalysisDeclContext()->getCFGStmtMap(); CurTerminatorStmt = Map->getBlock(CurStmt)->getTerminator(); } else { return nullptr; } if (!CurTerminatorStmt) return nullptr; SourceLocation TerminatorLoc = CurTerminatorStmt->getBeginLoc(); if (TerminatorLoc.isMacroID()) { SourceLocation BugLoc = BugPoint->getStmt()->getBeginLoc(); // Suppress reports unless we are in that same macro. if (!BugLoc.isMacroID() || getMacroName(BugLoc, BRC) != getMacroName(TerminatorLoc, BRC)) { BR.markInvalid("Suppress Macro IDC", CurLC); } return nullptr; } } return nullptr; } static const MemRegion *getLocationRegionIfReference(const Expr *E, const ExplodedNode *N) { if (const auto *DR = dyn_cast(E)) { if (const auto *VD = dyn_cast(DR->getDecl())) { if (!VD->getType()->isReferenceType()) return nullptr; ProgramStateManager &StateMgr = N->getState()->getStateManager(); MemRegionManager &MRMgr = StateMgr.getRegionManager(); return MRMgr.getVarRegion(VD, N->getLocationContext()); } } // FIXME: This does not handle other kinds of null references, // for example, references from FieldRegions: // struct Wrapper { int &ref; }; // Wrapper w = { *(int *)0 }; // w.ref = 1; return nullptr; } /// \return A subexpression of {@code Ex} which represents the /// expression-of-interest. static const Expr *peelOffOuterExpr(const Expr *Ex, const ExplodedNode *N) { Ex = Ex->IgnoreParenCasts(); if (const auto *FE = dyn_cast(Ex)) return peelOffOuterExpr(FE->getSubExpr(), N); if (const auto *OVE = dyn_cast(Ex)) return peelOffOuterExpr(OVE->getSourceExpr(), N); if (const auto *POE = dyn_cast(Ex)) { const auto *PropRef = dyn_cast(POE->getSyntacticForm()); if (PropRef && PropRef->isMessagingGetter()) { const Expr *GetterMessageSend = POE->getSemanticExpr(POE->getNumSemanticExprs() - 1); assert(isa(GetterMessageSend->IgnoreParenCasts())); return peelOffOuterExpr(GetterMessageSend, N); } } // Peel off the ternary operator. if (const auto *CO = dyn_cast(Ex)) { // Find a node where the branching occurred and find out which branch // we took (true/false) by looking at the ExplodedGraph. const ExplodedNode *NI = N; do { ProgramPoint ProgPoint = NI->getLocation(); if (Optional BE = ProgPoint.getAs()) { const CFGBlock *srcBlk = BE->getSrc(); if (const Stmt *term = srcBlk->getTerminator()) { if (term == CO) { bool TookTrueBranch = (*(srcBlk->succ_begin()) == BE->getDst()); if (TookTrueBranch) return peelOffOuterExpr(CO->getTrueExpr(), N); else return peelOffOuterExpr(CO->getFalseExpr(), N); } } } NI = NI->getFirstPred(); } while (NI); } if (auto *BO = dyn_cast(Ex)) if (const Expr *SubEx = peelOffPointerArithmetic(BO)) return peelOffOuterExpr(SubEx, N); if (auto *UO = dyn_cast(Ex)) { if (UO->getOpcode() == UO_LNot) return peelOffOuterExpr(UO->getSubExpr(), N); // FIXME: There's a hack in our Store implementation that always computes // field offsets around null pointers as if they are always equal to 0. // The idea here is to report accesses to fields as null dereferences // even though the pointer value that's being dereferenced is actually // the offset of the field rather than exactly 0. // See the FIXME in StoreManager's getLValueFieldOrIvar() method. // This code interacts heavily with this hack; otherwise the value // would not be null at all for most fields, so we'd be unable to track it. if (UO->getOpcode() == UO_AddrOf && UO->getSubExpr()->isLValue()) if (const Expr *DerefEx = bugreporter::getDerefExpr(UO->getSubExpr())) return peelOffOuterExpr(DerefEx, N); } return Ex; } /// Find the ExplodedNode where the lvalue (the value of 'Ex') /// was computed. static const ExplodedNode* findNodeForExpression(const ExplodedNode *N, const Expr *Inner) { while (N) { if (PathDiagnosticLocation::getStmt(N) == Inner) return N; N = N->getFirstPred(); } return N; } bool bugreporter::trackExpressionValue(const ExplodedNode *InputNode, const Expr *E, BugReport &report, bool EnableNullFPSuppression) { if (!E || !InputNode) return false; const Expr *Inner = peelOffOuterExpr(E, InputNode); const ExplodedNode *LVNode = findNodeForExpression(InputNode, Inner); if (!LVNode) return false; ProgramStateRef LVState = LVNode->getState(); // The message send could be nil due to the receiver being nil. // At this point in the path, the receiver should be live since we are at the // message send expr. If it is nil, start tracking it. if (const Expr *Receiver = NilReceiverBRVisitor::getNilReceiver(Inner, LVNode)) trackExpressionValue(LVNode, Receiver, report, EnableNullFPSuppression); // See if the expression we're interested refers to a variable. // If so, we can track both its contents and constraints on its value. if (ExplodedGraph::isInterestingLValueExpr(Inner)) { SVal LVal = LVNode->getSVal(Inner); const MemRegion *RR = getLocationRegionIfReference(Inner, LVNode); bool LVIsNull = LVState->isNull(LVal).isConstrainedTrue(); // If this is a C++ reference to a null pointer, we are tracking the // pointer. In addition, we should find the store at which the reference // got initialized. if (RR && !LVIsNull) if (auto KV = LVal.getAs()) report.addVisitor(llvm::make_unique( *KV, RR, EnableNullFPSuppression)); // In case of C++ references, we want to differentiate between a null // reference and reference to null pointer. // If the LVal is null, check if we are dealing with null reference. // For those, we want to track the location of the reference. const MemRegion *R = (RR && LVIsNull) ? RR : LVNode->getSVal(Inner).getAsRegion(); if (R) { // Mark both the variable region and its contents as interesting. SVal V = LVState->getRawSVal(loc::MemRegionVal(R)); report.addVisitor( llvm::make_unique(cast(R))); MacroNullReturnSuppressionVisitor::addMacroVisitorIfNecessary( LVNode, R, EnableNullFPSuppression, report, V); report.markInteresting(V); report.addVisitor(llvm::make_unique(R)); // If the contents are symbolic, find out when they became null. if (V.getAsLocSymbol(/*IncludeBaseRegions*/ true)) report.addVisitor(llvm::make_unique( V.castAs(), false)); // Add visitor, which will suppress inline defensive checks. if (auto DV = V.getAs()) if (!DV->isZeroConstant() && LVState->isNull(*DV).isConstrainedTrue() && EnableNullFPSuppression) report.addVisitor( llvm::make_unique(*DV, LVNode)); if (auto KV = V.getAs()) report.addVisitor(llvm::make_unique( *KV, R, EnableNullFPSuppression)); return true; } } // If the expression is not an "lvalue expression", we can still // track the constraints on its contents. SVal V = LVState->getSValAsScalarOrLoc(Inner, LVNode->getLocationContext()); ReturnVisitor::addVisitorIfNecessary( LVNode, Inner, report, EnableNullFPSuppression); // Is it a symbolic value? if (auto L = V.getAs()) { report.addVisitor(llvm::make_unique(L->getRegion())); // FIXME: this is a hack for fixing a later crash when attempting to // dereference a void* pointer. // We should not try to dereference pointers at all when we don't care // what is written inside the pointer. bool CanDereference = true; if (const auto *SR = dyn_cast(L->getRegion())) if (SR->getSymbol()->getType()->getPointeeType()->isVoidType()) CanDereference = false; // At this point we are dealing with the region's LValue. // However, if the rvalue is a symbolic region, we should track it as well. // Try to use the correct type when looking up the value. SVal RVal; if (ExplodedGraph::isInterestingLValueExpr(Inner)) { RVal = LVState->getRawSVal(L.getValue(), Inner->getType()); } else if (CanDereference) { RVal = LVState->getSVal(L->getRegion()); } if (CanDereference) if (auto KV = RVal.getAs()) report.addVisitor(llvm::make_unique( *KV, L->getRegion(), EnableNullFPSuppression)); const MemRegion *RegionRVal = RVal.getAsRegion(); if (RegionRVal && isa(RegionRVal)) { report.markInteresting(RegionRVal); report.addVisitor(llvm::make_unique( loc::MemRegionVal(RegionRVal), /*assumption=*/false)); } } return true; } const Expr *NilReceiverBRVisitor::getNilReceiver(const Stmt *S, const ExplodedNode *N) { const auto *ME = dyn_cast(S); if (!ME) return nullptr; if (const Expr *Receiver = ME->getInstanceReceiver()) { ProgramStateRef state = N->getState(); SVal V = N->getSVal(Receiver); if (state->isNull(V).isConstrainedTrue()) return Receiver; } return nullptr; } std::shared_ptr NilReceiverBRVisitor::VisitNode(const ExplodedNode *N, BugReporterContext &BRC, BugReport &BR) { Optional P = N->getLocationAs(); if (!P) return nullptr; const Stmt *S = P->getStmt(); const Expr *Receiver = getNilReceiver(S, N); if (!Receiver) return nullptr; llvm::SmallString<256> Buf; llvm::raw_svector_ostream OS(Buf); if (const auto *ME = dyn_cast(S)) { OS << "'"; ME->getSelector().print(OS); OS << "' not called"; } else { OS << "No method is called"; } OS << " because the receiver is nil"; // The receiver was nil, and hence the method was skipped. // Register a BugReporterVisitor to issue a message telling us how // the receiver was null. bugreporter::trackExpressionValue(N, Receiver, BR, /*EnableNullFPSuppression*/ false); // Issue a message saying that the method was skipped. PathDiagnosticLocation L(Receiver, BRC.getSourceManager(), N->getLocationContext()); return std::make_shared(L, OS.str()); } // Registers every VarDecl inside a Stmt with a last store visitor. void FindLastStoreBRVisitor::registerStatementVarDecls(BugReport &BR, const Stmt *S, bool EnableNullFPSuppression) { const ExplodedNode *N = BR.getErrorNode(); std::deque WorkList; WorkList.push_back(S); while (!WorkList.empty()) { const Stmt *Head = WorkList.front(); WorkList.pop_front(); ProgramStateManager &StateMgr = N->getState()->getStateManager(); if (const auto *DR = dyn_cast(Head)) { if (const auto *VD = dyn_cast(DR->getDecl())) { const VarRegion *R = StateMgr.getRegionManager().getVarRegion(VD, N->getLocationContext()); // What did we load? SVal V = N->getSVal(S); if (V.getAs() || V.getAs()) { // Register a new visitor with the BugReport. BR.addVisitor(llvm::make_unique( V.castAs(), R, EnableNullFPSuppression)); } } } for (const Stmt *SubStmt : Head->children()) WorkList.push_back(SubStmt); } } //===----------------------------------------------------------------------===// // Visitor that tries to report interesting diagnostics from conditions. //===----------------------------------------------------------------------===// /// Return the tag associated with this visitor. This tag will be used /// to make all PathDiagnosticPieces created by this visitor. const char *ConditionBRVisitor::getTag() { return "ConditionBRVisitor"; } std::shared_ptr ConditionBRVisitor::VisitNode(const ExplodedNode *N, BugReporterContext &BRC, BugReport &BR) { auto piece = VisitNodeImpl(N, BRC, BR); if (piece) { piece->setTag(getTag()); if (auto *ev = dyn_cast(piece.get())) ev->setPrunable(true, /* override */ false); } return piece; } std::shared_ptr ConditionBRVisitor::VisitNodeImpl(const ExplodedNode *N, BugReporterContext &BRC, BugReport &BR) { ProgramPoint progPoint = N->getLocation(); ProgramStateRef CurrentState = N->getState(); ProgramStateRef PrevState = N->getFirstPred()->getState(); // Compare the GDMs of the state, because that is where constraints // are managed. Note that ensure that we only look at nodes that // were generated by the analyzer engine proper, not checkers. if (CurrentState->getGDM().getRoot() == PrevState->getGDM().getRoot()) return nullptr; // If an assumption was made on a branch, it should be caught // here by looking at the state transition. if (Optional BE = progPoint.getAs()) { const CFGBlock *srcBlk = BE->getSrc(); if (const Stmt *term = srcBlk->getTerminator()) return VisitTerminator(term, N, srcBlk, BE->getDst(), BR, BRC); return nullptr; } if (Optional PS = progPoint.getAs()) { const std::pair &tags = ExprEngine::geteagerlyAssumeBinOpBifurcationTags(); const ProgramPointTag *tag = PS->getTag(); if (tag == tags.first) return VisitTrueTest(cast(PS->getStmt()), true, BRC, BR, N); if (tag == tags.second) return VisitTrueTest(cast(PS->getStmt()), false, BRC, BR, N); return nullptr; } return nullptr; } std::shared_ptr ConditionBRVisitor::VisitTerminator( const Stmt *Term, const ExplodedNode *N, const CFGBlock *srcBlk, const CFGBlock *dstBlk, BugReport &R, BugReporterContext &BRC) { const Expr *Cond = nullptr; // In the code below, Term is a CFG terminator and Cond is a branch condition // expression upon which the decision is made on this terminator. // // For example, in "if (x == 0)", the "if (x == 0)" statement is a terminator, // and "x == 0" is the respective condition. // // Another example: in "if (x && y)", we've got two terminators and two // conditions due to short-circuit nature of operator "&&": // 1. The "if (x && y)" statement is a terminator, // and "y" is the respective condition. // 2. Also "x && ..." is another terminator, // and "x" is its condition. switch (Term->getStmtClass()) { // FIXME: Stmt::SwitchStmtClass is worth handling, however it is a bit // more tricky because there are more than two branches to account for. default: return nullptr; case Stmt::IfStmtClass: Cond = cast(Term)->getCond(); break; case Stmt::ConditionalOperatorClass: Cond = cast(Term)->getCond(); break; case Stmt::BinaryOperatorClass: // When we encounter a logical operator (&& or ||) as a CFG terminator, // then the condition is actually its LHS; otherwise, we'd encounter // the parent, such as if-statement, as a terminator. const auto *BO = cast(Term); assert(BO->isLogicalOp() && "CFG terminator is not a short-circuit operator!"); Cond = BO->getLHS(); break; } // However, when we encounter a logical operator as a branch condition, // then the condition is actually its RHS, because LHS would be // the condition for the logical operator terminator. while (const auto *InnerBO = dyn_cast(Cond)) { if (!InnerBO->isLogicalOp()) break; Cond = InnerBO->getRHS()->IgnoreParens(); } assert(Cond); assert(srcBlk->succ_size() == 2); const bool tookTrue = *(srcBlk->succ_begin()) == dstBlk; return VisitTrueTest(Cond, tookTrue, BRC, R, N); } std::shared_ptr ConditionBRVisitor::VisitTrueTest(const Expr *Cond, bool tookTrue, BugReporterContext &BRC, BugReport &R, const ExplodedNode *N) { // These will be modified in code below, but we need to preserve the original // values in case we want to throw the generic message. const Expr *CondTmp = Cond; bool tookTrueTmp = tookTrue; while (true) { CondTmp = CondTmp->IgnoreParenCasts(); switch (CondTmp->getStmtClass()) { default: break; case Stmt::BinaryOperatorClass: if (auto P = VisitTrueTest(Cond, cast(CondTmp), tookTrueTmp, BRC, R, N)) return P; break; case Stmt::DeclRefExprClass: if (auto P = VisitTrueTest(Cond, cast(CondTmp), tookTrueTmp, BRC, R, N)) return P; break; case Stmt::UnaryOperatorClass: { const auto *UO = cast(CondTmp); if (UO->getOpcode() == UO_LNot) { tookTrueTmp = !tookTrueTmp; CondTmp = UO->getSubExpr(); continue; } break; } } break; } // Condition too complex to explain? Just say something so that the user // knew we've made some path decision at this point. const LocationContext *LCtx = N->getLocationContext(); PathDiagnosticLocation Loc(Cond, BRC.getSourceManager(), LCtx); if (!Loc.isValid() || !Loc.asLocation().isValid()) return nullptr; return std::make_shared( Loc, tookTrue ? GenericTrueMessage : GenericFalseMessage); } bool ConditionBRVisitor::patternMatch(const Expr *Ex, const Expr *ParentEx, raw_ostream &Out, BugReporterContext &BRC, BugReport &report, const ExplodedNode *N, Optional &prunable) { const Expr *OriginalExpr = Ex; Ex = Ex->IgnoreParenCasts(); // Use heuristics to determine if Ex is a macro expending to a literal and // if so, use the macro's name. SourceLocation LocStart = Ex->getBeginLoc(); SourceLocation LocEnd = Ex->getEndLoc(); if (LocStart.isMacroID() && LocEnd.isMacroID() && (isa(Ex) || isa(Ex) || isa(Ex) || isa(Ex) || isa(Ex))) { StringRef StartName = Lexer::getImmediateMacroNameForDiagnostics(LocStart, BRC.getSourceManager(), BRC.getASTContext().getLangOpts()); StringRef EndName = Lexer::getImmediateMacroNameForDiagnostics(LocEnd, BRC.getSourceManager(), BRC.getASTContext().getLangOpts()); bool beginAndEndAreTheSameMacro = StartName.equals(EndName); bool partOfParentMacro = false; if (ParentEx->getBeginLoc().isMacroID()) { StringRef PName = Lexer::getImmediateMacroNameForDiagnostics( ParentEx->getBeginLoc(), BRC.getSourceManager(), BRC.getASTContext().getLangOpts()); partOfParentMacro = PName.equals(StartName); } if (beginAndEndAreTheSameMacro && !partOfParentMacro ) { // Get the location of the macro name as written by the caller. SourceLocation Loc = LocStart; while (LocStart.isMacroID()) { Loc = LocStart; LocStart = BRC.getSourceManager().getImmediateMacroCallerLoc(LocStart); } StringRef MacroName = Lexer::getImmediateMacroNameForDiagnostics( Loc, BRC.getSourceManager(), BRC.getASTContext().getLangOpts()); // Return the macro name. Out << MacroName; return false; } } if (const auto *DR = dyn_cast(Ex)) { const bool quotes = isa(DR->getDecl()); if (quotes) { Out << '\''; const LocationContext *LCtx = N->getLocationContext(); const ProgramState *state = N->getState().get(); if (const MemRegion *R = state->getLValue(cast(DR->getDecl()), LCtx).getAsRegion()) { if (report.isInteresting(R)) prunable = false; else { const ProgramState *state = N->getState().get(); SVal V = state->getSVal(R); if (report.isInteresting(V)) prunable = false; } } } Out << DR->getDecl()->getDeclName().getAsString(); if (quotes) Out << '\''; return quotes; } if (const auto *IL = dyn_cast(Ex)) { QualType OriginalTy = OriginalExpr->getType(); if (OriginalTy->isPointerType()) { if (IL->getValue() == 0) { Out << "null"; return false; } } else if (OriginalTy->isObjCObjectPointerType()) { if (IL->getValue() == 0) { Out << "nil"; return false; } } Out << IL->getValue(); return false; } return false; } std::shared_ptr ConditionBRVisitor::VisitTrueTest(const Expr *Cond, const BinaryOperator *BExpr, const bool tookTrue, BugReporterContext &BRC, BugReport &R, const ExplodedNode *N) { bool shouldInvert = false; Optional shouldPrune; SmallString<128> LhsString, RhsString; { llvm::raw_svector_ostream OutLHS(LhsString), OutRHS(RhsString); const bool isVarLHS = patternMatch(BExpr->getLHS(), BExpr, OutLHS, BRC, R, N, shouldPrune); const bool isVarRHS = patternMatch(BExpr->getRHS(), BExpr, OutRHS, BRC, R, N, shouldPrune); shouldInvert = !isVarLHS && isVarRHS; } BinaryOperator::Opcode Op = BExpr->getOpcode(); if (BinaryOperator::isAssignmentOp(Op)) { // For assignment operators, all that we care about is that the LHS // evaluates to "true" or "false". return VisitConditionVariable(LhsString, BExpr->getLHS(), tookTrue, BRC, R, N); } // For non-assignment operations, we require that we can understand // both the LHS and RHS. if (LhsString.empty() || RhsString.empty() || !BinaryOperator::isComparisonOp(Op) || Op == BO_Cmp) return nullptr; // Should we invert the strings if the LHS is not a variable name? SmallString<256> buf; llvm::raw_svector_ostream Out(buf); Out << "Assuming " << (shouldInvert ? RhsString : LhsString) << " is "; // Do we need to invert the opcode? if (shouldInvert) switch (Op) { default: break; case BO_LT: Op = BO_GT; break; case BO_GT: Op = BO_LT; break; case BO_LE: Op = BO_GE; break; case BO_GE: Op = BO_LE; break; } if (!tookTrue) switch (Op) { case BO_EQ: Op = BO_NE; break; case BO_NE: Op = BO_EQ; break; case BO_LT: Op = BO_GE; break; case BO_GT: Op = BO_LE; break; case BO_LE: Op = BO_GT; break; case BO_GE: Op = BO_LT; break; default: return nullptr; } switch (Op) { case BO_EQ: Out << "equal to "; break; case BO_NE: Out << "not equal to "; break; default: Out << BinaryOperator::getOpcodeStr(Op) << ' '; break; } Out << (shouldInvert ? LhsString : RhsString); const LocationContext *LCtx = N->getLocationContext(); PathDiagnosticLocation Loc(Cond, BRC.getSourceManager(), LCtx); auto event = std::make_shared(Loc, Out.str()); if (shouldPrune.hasValue()) event->setPrunable(shouldPrune.getValue()); return event; } std::shared_ptr ConditionBRVisitor::VisitConditionVariable( StringRef LhsString, const Expr *CondVarExpr, const bool tookTrue, BugReporterContext &BRC, BugReport &report, const ExplodedNode *N) { // FIXME: If there's already a constraint tracker for this variable, // we shouldn't emit anything here (c.f. the double note in // test/Analysis/inlining/path-notes.c) SmallString<256> buf; llvm::raw_svector_ostream Out(buf); Out << "Assuming " << LhsString << " is "; QualType Ty = CondVarExpr->getType(); if (Ty->isPointerType()) Out << (tookTrue ? "not null" : "null"); else if (Ty->isObjCObjectPointerType()) Out << (tookTrue ? "not nil" : "nil"); else if (Ty->isBooleanType()) Out << (tookTrue ? "true" : "false"); else if (Ty->isIntegralOrEnumerationType()) Out << (tookTrue ? "non-zero" : "zero"); else return nullptr; const LocationContext *LCtx = N->getLocationContext(); PathDiagnosticLocation Loc(CondVarExpr, BRC.getSourceManager(), LCtx); auto event = std::make_shared(Loc, Out.str()); if (const auto *DR = dyn_cast(CondVarExpr)) { if (const auto *VD = dyn_cast(DR->getDecl())) { const ProgramState *state = N->getState().get(); if (const MemRegion *R = state->getLValue(VD, LCtx).getAsRegion()) { if (report.isInteresting(R)) event->setPrunable(false); } } } return event; } std::shared_ptr ConditionBRVisitor::VisitTrueTest(const Expr *Cond, const DeclRefExpr *DR, const bool tookTrue, BugReporterContext &BRC, BugReport &report, const ExplodedNode *N) { const auto *VD = dyn_cast(DR->getDecl()); if (!VD) return nullptr; SmallString<256> Buf; llvm::raw_svector_ostream Out(Buf); Out << "Assuming '" << VD->getDeclName() << "' is "; QualType VDTy = VD->getType(); if (VDTy->isPointerType()) Out << (tookTrue ? "non-null" : "null"); else if (VDTy->isObjCObjectPointerType()) Out << (tookTrue ? "non-nil" : "nil"); else if (VDTy->isScalarType()) Out << (tookTrue ? "not equal to 0" : "0"); else return nullptr; const LocationContext *LCtx = N->getLocationContext(); PathDiagnosticLocation Loc(Cond, BRC.getSourceManager(), LCtx); auto event = std::make_shared(Loc, Out.str()); const ProgramState *state = N->getState().get(); if (const MemRegion *R = state->getLValue(VD, LCtx).getAsRegion()) { if (report.isInteresting(R)) event->setPrunable(false); else { SVal V = state->getSVal(R); if (report.isInteresting(V)) event->setPrunable(false); } } return std::move(event); } const char *const ConditionBRVisitor::GenericTrueMessage = "Assuming the condition is true"; const char *const ConditionBRVisitor::GenericFalseMessage = "Assuming the condition is false"; bool ConditionBRVisitor::isPieceMessageGeneric( const PathDiagnosticPiece *Piece) { return Piece->getString() == GenericTrueMessage || Piece->getString() == GenericFalseMessage; } void LikelyFalsePositiveSuppressionBRVisitor::finalizeVisitor( BugReporterContext &BRC, const ExplodedNode *N, BugReport &BR) { // Here we suppress false positives coming from system headers. This list is // based on known issues. AnalyzerOptions &Options = BRC.getAnalyzerOptions(); const Decl *D = N->getLocationContext()->getDecl(); if (AnalysisDeclContext::isInStdNamespace(D)) { // Skip reports within the 'std' namespace. Although these can sometimes be // the user's fault, we currently don't report them very well, and // Note that this will not help for any other data structure libraries, like // TR1, Boost, or llvm/ADT. if (Options.ShouldSuppressFromCXXStandardLibrary) { BR.markInvalid(getTag(), nullptr); return; } else { // If the complete 'std' suppression is not enabled, suppress reports // from the 'std' namespace that are known to produce false positives. // The analyzer issues a false use-after-free when std::list::pop_front // or std::list::pop_back are called multiple times because we cannot // reason about the internal invariants of the data structure. if (const auto *MD = dyn_cast(D)) { const CXXRecordDecl *CD = MD->getParent(); if (CD->getName() == "list") { BR.markInvalid(getTag(), nullptr); return; } } // The analyzer issues a false positive when the constructor of // std::__independent_bits_engine from algorithms is used. if (const auto *MD = dyn_cast(D)) { const CXXRecordDecl *CD = MD->getParent(); if (CD->getName() == "__independent_bits_engine") { BR.markInvalid(getTag(), nullptr); return; } } for (const LocationContext *LCtx = N->getLocationContext(); LCtx; LCtx = LCtx->getParent()) { const auto *MD = dyn_cast(LCtx->getDecl()); if (!MD) continue; const CXXRecordDecl *CD = MD->getParent(); // The analyzer issues a false positive on // std::basic_string v; v.push_back(1); // and // std::u16string s; s += u'a'; // because we cannot reason about the internal invariants of the // data structure. if (CD->getName() == "basic_string") { BR.markInvalid(getTag(), nullptr); return; } // The analyzer issues a false positive on // std::shared_ptr p(new int(1)); p = nullptr; // because it does not reason properly about temporary destructors. if (CD->getName() == "shared_ptr") { BR.markInvalid(getTag(), nullptr); return; } } } } // Skip reports within the sys/queue.h macros as we do not have the ability to // reason about data structure shapes. SourceManager &SM = BRC.getSourceManager(); FullSourceLoc Loc = BR.getLocation(SM).asLocation(); while (Loc.isMacroID()) { Loc = Loc.getSpellingLoc(); if (SM.getFilename(Loc).endswith("sys/queue.h")) { BR.markInvalid(getTag(), nullptr); return; } } } std::shared_ptr UndefOrNullArgVisitor::VisitNode(const ExplodedNode *N, BugReporterContext &BRC, BugReport &BR) { ProgramStateRef State = N->getState(); ProgramPoint ProgLoc = N->getLocation(); // We are only interested in visiting CallEnter nodes. Optional CEnter = ProgLoc.getAs(); if (!CEnter) return nullptr; // Check if one of the arguments is the region the visitor is tracking. CallEventManager &CEMgr = BRC.getStateManager().getCallEventManager(); CallEventRef<> Call = CEMgr.getCaller(CEnter->getCalleeContext(), State); unsigned Idx = 0; ArrayRef parms = Call->parameters(); for (const auto ParamDecl : parms) { const MemRegion *ArgReg = Call->getArgSVal(Idx).getAsRegion(); ++Idx; // Are we tracking the argument or its subregion? if ( !ArgReg || !R->isSubRegionOf(ArgReg->StripCasts())) continue; // Check the function parameter type. assert(ParamDecl && "Formal parameter has no decl?"); QualType T = ParamDecl->getType(); if (!(T->isAnyPointerType() || T->isReferenceType())) { // Function can only change the value passed in by address. continue; } // If it is a const pointer value, the function does not intend to // change the value. if (T->getPointeeType().isConstQualified()) continue; // Mark the call site (LocationContext) as interesting if the value of the // argument is undefined or '0'/'NULL'. SVal BoundVal = State->getSVal(R); if (BoundVal.isUndef() || BoundVal.isZeroConstant()) { BR.markInteresting(CEnter->getCalleeContext()); return nullptr; } } return nullptr; } std::shared_ptr CXXSelfAssignmentBRVisitor::VisitNode(const ExplodedNode *Succ, BugReporterContext &BRC, BugReport &) { if (Satisfied) return nullptr; const auto Edge = Succ->getLocation().getAs(); if (!Edge.hasValue()) return nullptr; auto Tag = Edge->getTag(); if (!Tag) return nullptr; if (Tag->getTagDescription() != "cplusplus.SelfAssignment") return nullptr; Satisfied = true; const auto *Met = dyn_cast(Succ->getCodeDecl().getAsFunction()); assert(Met && "Not a C++ method."); assert((Met->isCopyAssignmentOperator() || Met->isMoveAssignmentOperator()) && "Not a copy/move assignment operator."); const auto *LCtx = Edge->getLocationContext(); const auto &State = Succ->getState(); auto &SVB = State->getStateManager().getSValBuilder(); const auto Param = State->getSVal(State->getRegion(Met->getParamDecl(0), LCtx)); const auto This = State->getSVal(SVB.getCXXThis(Met, LCtx->getStackFrame())); auto L = PathDiagnosticLocation::create(Met, BRC.getSourceManager()); if (!L.isValid() || !L.asLocation().isValid()) return nullptr; SmallString<256> Buf; llvm::raw_svector_ostream Out(Buf); Out << "Assuming " << Met->getParamDecl(0)->getName() << ((Param == This) ? " == " : " != ") << "*this"; auto Piece = std::make_shared(L, Out.str()); Piece->addRange(Met->getSourceRange()); return std::move(Piece); } std::shared_ptr TaintBugVisitor::VisitNode(const ExplodedNode *N, BugReporterContext &BRC, BugReport &) { // Find the ExplodedNode where the taint was first introduced if (!N->getState()->isTainted(V) || N->getFirstPred()->getState()->isTainted(V)) return nullptr; const Stmt *S = PathDiagnosticLocation::getStmt(N); if (!S) return nullptr; const LocationContext *NCtx = N->getLocationContext(); PathDiagnosticLocation L = PathDiagnosticLocation::createBegin(S, BRC.getSourceManager(), NCtx); if (!L.isValid() || !L.asLocation().isValid()) return nullptr; return std::make_shared(L, "Taint originated here"); } FalsePositiveRefutationBRVisitor::FalsePositiveRefutationBRVisitor() : Constraints(ConstraintRangeTy::Factory().getEmptyMap()) {} void FalsePositiveRefutationBRVisitor::finalizeVisitor( BugReporterContext &BRC, const ExplodedNode *EndPathNode, BugReport &BR) { // Collect new constraints VisitNode(EndPathNode, BRC, BR); // Create a refutation manager SMTSolverRef RefutationSolver = CreateZ3Solver(); ASTContext &Ctx = BRC.getASTContext(); // Add constraints to the solver for (const auto &I : Constraints) { const SymbolRef Sym = I.first; auto RangeIt = I.second.begin(); SMTExprRef Constraints = SMTConv::getRangeExpr( RefutationSolver, Ctx, Sym, RangeIt->From(), RangeIt->To(), /*InRange=*/true); while ((++RangeIt) != I.second.end()) { Constraints = RefutationSolver->mkOr( Constraints, SMTConv::getRangeExpr(RefutationSolver, Ctx, Sym, RangeIt->From(), RangeIt->To(), /*InRange=*/true)); } RefutationSolver->addConstraint(Constraints); } // And check for satisfiability Optional isSat = RefutationSolver->check(); if (!isSat.hasValue()) return; if (!isSat.getValue()) BR.markInvalid("Infeasible constraints", EndPathNode->getLocationContext()); } std::shared_ptr FalsePositiveRefutationBRVisitor::VisitNode(const ExplodedNode *N, BugReporterContext &, BugReport &) { // Collect new constraints const ConstraintRangeTy &NewCs = N->getState()->get(); ConstraintRangeTy::Factory &CF = N->getState()->get_context(); // Add constraints if we don't have them yet for (auto const &C : NewCs) { const SymbolRef &Sym = C.first; if (!Constraints.contains(Sym)) { Constraints = CF.add(Constraints, Sym, C.second); } } return nullptr; } void FalsePositiveRefutationBRVisitor::Profile( llvm::FoldingSetNodeID &ID) const { static int Tag = 0; ID.AddPointer(&Tag); }