//== RegionStore.cpp - Field-sensitive store model --------------*- C++ -*--==// // // The LLVM Compiler Infrastructure // // This file is distributed under the University of Illinois Open Source // License. See LICENSE.TXT for details. // //===----------------------------------------------------------------------===// // // This file defines a basic region store model. In this model, we do have field // sensitivity. But we assume nothing about the heap shape. So recursive data // structures are largely ignored. Basically we do 1-limiting analysis. // Parameter pointers are assumed with no aliasing. Pointee objects of // parameters are created lazily. // //===----------------------------------------------------------------------===// #include "clang/Analysis/PathSensitive/MemRegion.h" #include "clang/Analysis/PathSensitive/AnalysisContext.h" #include "clang/Analysis/PathSensitive/GRState.h" #include "clang/Analysis/PathSensitive/GRStateTrait.h" #include "clang/Analysis/Analyses/LiveVariables.h" #include "clang/Analysis/Support/Optional.h" #include "clang/Basic/TargetInfo.h" #include "llvm/ADT/ImmutableMap.h" #include "llvm/ADT/ImmutableList.h" #include "llvm/Support/raw_ostream.h" #include "llvm/Support/Compiler.h" using namespace clang; #define HEAP_UNDEFINED 0 #define USE_EXPLICIT_COMPOUND 0 // Actual Store type. typedef llvm::ImmutableMap RegionBindings; //===----------------------------------------------------------------------===// // Fine-grained control of RegionStoreManager. //===----------------------------------------------------------------------===// namespace { struct VISIBILITY_HIDDEN minimal_features_tag {}; struct VISIBILITY_HIDDEN maximal_features_tag {}; class VISIBILITY_HIDDEN RegionStoreFeatures { bool SupportsFields; bool SupportsRemaining; public: RegionStoreFeatures(minimal_features_tag) : SupportsFields(false), SupportsRemaining(false) {} RegionStoreFeatures(maximal_features_tag) : SupportsFields(true), SupportsRemaining(false) {} void enableFields(bool t) { SupportsFields = t; } bool supportsFields() const { return SupportsFields; } bool supportsRemaining() const { return SupportsRemaining; } }; } //===----------------------------------------------------------------------===// // Region "Extents" //===----------------------------------------------------------------------===// // // MemRegions represent chunks of memory with a size (their "extent"). This // GDM entry tracks the extents for regions. Extents are in bytes. // namespace { class VISIBILITY_HIDDEN RegionExtents {}; } static int RegionExtentsIndex = 0; namespace clang { template<> struct GRStateTrait : public GRStatePartialTrait > { static void* GDMIndex() { return &RegionExtentsIndex; } }; } //===----------------------------------------------------------------------===// // Regions with default values. //===----------------------------------------------------------------------===// // // This GDM entry tracks what regions have a default value if they have no bound // value and have not been killed. // namespace { class VISIBILITY_HIDDEN RegionDefaultValue { public: typedef llvm::ImmutableMap MapTy; }; } static int RegionDefaultValueIndex = 0; namespace clang { template<> struct GRStateTrait : public GRStatePartialTrait { static void* GDMIndex() { return &RegionDefaultValueIndex; } }; } typedef RegionDefaultValue::MapTy RegionDefaultBindings; //===----------------------------------------------------------------------===// // Utility functions. //===----------------------------------------------------------------------===// static bool IsAnyPointerOrIntptr(QualType ty, ASTContext &Ctx) { if (ty->isAnyPointerType()) return true; return ty->isIntegerType() && ty->isScalarType() && Ctx.getTypeSize(ty) == Ctx.getTypeSize(Ctx.VoidPtrTy); } //===----------------------------------------------------------------------===// // Main RegionStore logic. //===----------------------------------------------------------------------===// namespace { class VISIBILITY_HIDDEN RegionStoreSubRegionMap : public SubRegionMap { typedef llvm::ImmutableSet SetTy; typedef llvm::DenseMap Map; SetTy::Factory F; Map M; public: bool add(const MemRegion* Parent, const MemRegion* SubRegion) { Map::iterator I = M.find(Parent); if (I == M.end()) { M.insert(std::make_pair(Parent, F.Add(F.GetEmptySet(), SubRegion))); return true; } I->second = F.Add(I->second, SubRegion); return false; } void process(llvm::SmallVectorImpl &WL, const SubRegion *R); ~RegionStoreSubRegionMap() {} bool iterSubRegions(const MemRegion* Parent, Visitor& V) const { Map::iterator I = M.find(Parent); if (I == M.end()) return true; llvm::ImmutableSet S = I->second; for (llvm::ImmutableSet::iterator SI=S.begin(),SE=S.end(); SI != SE; ++SI) { if (!V.Visit(Parent, *SI)) return false; } return true; } typedef SetTy::iterator iterator; std::pair begin_end(const MemRegion *R) { Map::iterator I = M.find(R); SetTy S = I == M.end() ? F.GetEmptySet() : I->second; return std::make_pair(S.begin(), S.end()); } }; class VISIBILITY_HIDDEN RegionStoreManager : public StoreManager { const RegionStoreFeatures Features; RegionBindings::Factory RBFactory; public: RegionStoreManager(GRStateManager& mgr, const RegionStoreFeatures &f) : StoreManager(mgr), Features(f), RBFactory(mgr.getAllocator()) {} virtual ~RegionStoreManager() {} SubRegionMap *getSubRegionMap(const GRState *state); RegionStoreSubRegionMap *getRegionStoreSubRegionMap(const GRState *state); /// getDefaultBinding - Returns an SVal* representing an optional default /// binding associated with a region and its subregions. Optional getDefaultBinding(const GRState *state, const MemRegion *R); /// getLValueString - Returns an SVal representing the lvalue of a /// StringLiteral. Within RegionStore a StringLiteral has an /// associated StringRegion, and the lvalue of a StringLiteral is /// the lvalue of that region. SVal getLValueString(const GRState *state, const StringLiteral* S); /// getLValueCompoundLiteral - Returns an SVal representing the /// lvalue of a compound literal. Within RegionStore a compound /// literal has an associated region, and the lvalue of the /// compound literal is the lvalue of that region. SVal getLValueCompoundLiteral(const GRState *state, const CompoundLiteralExpr*); /// getLValueVar - Returns an SVal that represents the lvalue of a /// variable. Within RegionStore a variable has an associated /// VarRegion, and the lvalue of the variable is the lvalue of that region. SVal getLValueVar(const GRState *ST, const VarDecl *VD, const LocationContext *LC); SVal getLValueIvar(const GRState *state, const ObjCIvarDecl* D, SVal Base); SVal getLValueField(const GRState *state, SVal Base, const FieldDecl* D); SVal getLValueFieldOrIvar(const GRState *state, SVal Base, const Decl* D); SVal getLValueElement(const GRState *state, QualType elementType, SVal Base, SVal Offset); /// ArrayToPointer - Emulates the "decay" of an array to a pointer /// type. 'Array' represents the lvalue of the array being decayed /// to a pointer, and the returned SVal represents the decayed /// version of that lvalue (i.e., a pointer to the first element of /// the array). This is called by GRExprEngine when evaluating /// casts from arrays to pointers. SVal ArrayToPointer(Loc Array); SVal EvalBinOp(const GRState *state, BinaryOperator::Opcode Op,Loc L, NonLoc R, QualType resultTy); Store getInitialStore(const LocationContext *InitLoc) { return RBFactory.GetEmptyMap().getRoot(); } //===-------------------------------------------------------------------===// // Binding values to regions. //===-------------------------------------------------------------------===// const GRState *InvalidateRegion(const GRState *state, const MemRegion *R, const Expr *E, unsigned Count); private: void RemoveSubRegionBindings(RegionBindings &B, RegionDefaultBindings &DVM, RegionDefaultBindings::Factory &DVMFactory, const MemRegion *R, RegionStoreSubRegionMap &M); public: const GRState *Bind(const GRState *state, Loc LV, SVal V); const GRState *BindCompoundLiteral(const GRState *state, const CompoundLiteralExpr* CL, SVal V); const GRState *BindDecl(const GRState *ST, const VarDecl *VD, const LocationContext *LC, SVal InitVal); const GRState *BindDeclWithNoInit(const GRState *state, const VarDecl*, const LocationContext *) { return state; } /// BindStruct - Bind a compound value to a structure. const GRState *BindStruct(const GRState *, const TypedRegion* R, SVal V); const GRState *BindArray(const GRState *state, const TypedRegion* R, SVal V); /// KillStruct - Set the entire struct to unknown. const GRState *KillStruct(const GRState *state, const TypedRegion* R); const GRState *setDefaultValue(const GRState *state, const MemRegion* R, SVal V); Store Remove(Store store, Loc LV); //===------------------------------------------------------------------===// // Loading values from regions. //===------------------------------------------------------------------===// /// The high level logic for this method is this: /// Retrieve (L) /// if L has binding /// return L's binding /// else if L is in killset /// return unknown /// else /// if L is on stack or heap /// return undefined /// else /// return symbolic SValuator::CastResult Retrieve(const GRState *state, Loc L, QualType T = QualType()); SVal RetrieveElement(const GRState *state, const ElementRegion *R); SVal RetrieveField(const GRState *state, const FieldRegion *R); SVal RetrieveObjCIvar(const GRState *state, const ObjCIvarRegion *R); SVal RetrieveVar(const GRState *state, const VarRegion *R); SVal RetrieveLazySymbol(const GRState *state, const TypedRegion *R); SVal RetrieveFieldOrElementCommon(const GRState *state, const TypedRegion *R, QualType Ty, const MemRegion *superR); SValuator::CastResult CastRetrievedVal(SVal val, const GRState *state, const TypedRegion *R, QualType castTy); /// Retrieve the values in a struct and return a CompoundVal, used when doing /// struct copy: /// struct s x, y; /// x = y; /// y's value is retrieved by this method. SVal RetrieveStruct(const GRState *St, const TypedRegion* R); SVal RetrieveArray(const GRState *St, const TypedRegion* R); std::pair GetLazyBinding(RegionBindings B, const MemRegion *R); const GRState* CopyLazyBindings(nonloc::LazyCompoundVal V, const GRState *state, const TypedRegion *R); //===------------------------------------------------------------------===// // State pruning. //===------------------------------------------------------------------===// /// RemoveDeadBindings - Scans the RegionStore of 'state' for dead values. /// It returns a new Store with these values removed. void RemoveDeadBindings(GRState &state, Stmt* Loc, SymbolReaper& SymReaper, llvm::SmallVectorImpl& RegionRoots); //===------------------------------------------------------------------===// // Region "extents". //===------------------------------------------------------------------===// const GRState *setExtent(const GRState *state, const MemRegion* R, SVal Extent); SVal getSizeInElements(const GRState *state, const MemRegion* R); //===------------------------------------------------------------------===// // Utility methods. //===------------------------------------------------------------------===// static inline RegionBindings GetRegionBindings(Store store) { return RegionBindings(static_cast(store)); } void print(Store store, llvm::raw_ostream& Out, const char* nl, const char *sep); void iterBindings(Store store, BindingsHandler& f) { // FIXME: Implement. } // FIXME: Remove. BasicValueFactory& getBasicVals() { return StateMgr.getBasicVals(); } // FIXME: Remove. ASTContext& getContext() { return StateMgr.getContext(); } }; } // end anonymous namespace //===----------------------------------------------------------------------===// // RegionStore creation. //===----------------------------------------------------------------------===// StoreManager *clang::CreateRegionStoreManager(GRStateManager& StMgr) { RegionStoreFeatures F = maximal_features_tag(); return new RegionStoreManager(StMgr, F); } StoreManager *clang::CreateFieldsOnlyRegionStoreManager(GRStateManager &StMgr) { RegionStoreFeatures F = minimal_features_tag(); F.enableFields(true); return new RegionStoreManager(StMgr, F); } void RegionStoreSubRegionMap::process(llvm::SmallVectorImpl &WL, const SubRegion *R) { const MemRegion *superR = R->getSuperRegion(); if (add(superR, R)) if (const SubRegion *sr = dyn_cast(superR)) WL.push_back(sr); } RegionStoreSubRegionMap* RegionStoreManager::getRegionStoreSubRegionMap(const GRState *state) { RegionBindings B = GetRegionBindings(state->getStore()); RegionStoreSubRegionMap *M = new RegionStoreSubRegionMap(); llvm::SmallVector WL; for (RegionBindings::iterator I=B.begin(), E=B.end(); I!=E; ++I) if (const SubRegion *R = dyn_cast(I.getKey())) M->process(WL, R); RegionDefaultBindings DVM = state->get(); for (RegionDefaultBindings::iterator I = DVM.begin(), E = DVM.end(); I != E; ++I) if (const SubRegion *R = dyn_cast(I.getKey())) M->process(WL, R); // We also need to record in the subregion map "intermediate" regions that // don't have direct bindings but are super regions of those that do. while (!WL.empty()) { const SubRegion *R = WL.back(); WL.pop_back(); M->process(WL, R); } return M; } SubRegionMap *RegionStoreManager::getSubRegionMap(const GRState *state) { return getRegionStoreSubRegionMap(state); } //===----------------------------------------------------------------------===// // Binding invalidation. //===----------------------------------------------------------------------===// void RegionStoreManager::RemoveSubRegionBindings(RegionBindings &B, RegionDefaultBindings &DVM, RegionDefaultBindings::Factory &DVMFactory, const MemRegion *R, RegionStoreSubRegionMap &M) { RegionStoreSubRegionMap::iterator I, E; for (llvm::tie(I, E) = M.begin_end(R); I != E; ++I) RemoveSubRegionBindings(B, DVM, DVMFactory, *I, M); B = RBFactory.Remove(B, R); DVM = DVMFactory.Remove(DVM, R); } const GRState *RegionStoreManager::InvalidateRegion(const GRState *state, const MemRegion *R, const Expr *E, unsigned Count) { ASTContext& Ctx = StateMgr.getContext(); // Strip away casts. R = R->getBaseRegion(); // Remove the bindings to subregions. { // Get the mapping of regions -> subregions. llvm::OwningPtr SubRegions(getRegionStoreSubRegionMap(state)); RegionBindings B = GetRegionBindings(state->getStore()); RegionDefaultBindings DVM = state->get(); RegionDefaultBindings::Factory &DVMFactory = state->get_context(); RemoveSubRegionBindings(B, DVM, DVMFactory, R, *SubRegions.get()); state = state->makeWithStore(B.getRoot())->set(DVM); } if (!R->isBoundable()) return state; if (isa(R) || isa(R) || isa(R)) { // Invalidate the region by setting its default value to // conjured symbol. The type of the symbol is irrelavant. SVal V = ValMgr.getConjuredSymbolVal(E, Ctx.IntTy, Count); return setDefaultValue(state, R, V); } const TypedRegion *TR = cast(R); QualType T = TR->getValueType(Ctx); if (const RecordType *RT = T->getAsStructureType()) { // FIXME: handle structs with default region value. const RecordDecl *RD = RT->getDecl()->getDefinition(Ctx); // No record definition. There is nothing we can do. if (!RD) return state; // Invalidate the region by setting its default value to // conjured symbol. The type of the symbol is irrelavant. SVal V = ValMgr.getConjuredSymbolVal(E, Ctx.IntTy, Count); return setDefaultValue(state, R, V); } if (const ArrayType *AT = Ctx.getAsArrayType(T)) { // Set the default value of the array to conjured symbol. SVal V = ValMgr.getConjuredSymbolVal(E, AT->getElementType(), Count); return setDefaultValue(state, TR, V); } SVal V = ValMgr.getConjuredSymbolVal(E, T, Count); assert(SymbolManager::canSymbolicate(T) || V.isUnknown()); return Bind(state, ValMgr.makeLoc(TR), V); } //===----------------------------------------------------------------------===// // getLValueXXX methods. //===----------------------------------------------------------------------===// /// getLValueString - Returns an SVal representing the lvalue of a /// StringLiteral. Within RegionStore a StringLiteral has an /// associated StringRegion, and the lvalue of a StringLiteral is the /// lvalue of that region. SVal RegionStoreManager::getLValueString(const GRState *St, const StringLiteral* S) { return loc::MemRegionVal(MRMgr.getStringRegion(S)); } /// getLValueVar - Returns an SVal that represents the lvalue of a /// variable. Within RegionStore a variable has an associated /// VarRegion, and the lvalue of the variable is the lvalue of that region. SVal RegionStoreManager::getLValueVar(const GRState *ST, const VarDecl *VD, const LocationContext *LC) { return loc::MemRegionVal(MRMgr.getVarRegion(VD, LC)); } /// getLValueCompoundLiteral - Returns an SVal representing the lvalue /// of a compound literal. Within RegionStore a compound literal /// has an associated region, and the lvalue of the compound literal /// is the lvalue of that region. SVal RegionStoreManager::getLValueCompoundLiteral(const GRState *St, const CompoundLiteralExpr* CL) { return loc::MemRegionVal(MRMgr.getCompoundLiteralRegion(CL)); } SVal RegionStoreManager::getLValueIvar(const GRState *St, const ObjCIvarDecl* D, SVal Base) { return getLValueFieldOrIvar(St, Base, D); } SVal RegionStoreManager::getLValueField(const GRState *St, SVal Base, const FieldDecl* D) { return getLValueFieldOrIvar(St, Base, D); } SVal RegionStoreManager::getLValueFieldOrIvar(const GRState *St, SVal Base, const Decl* D) { if (Base.isUnknownOrUndef()) return Base; Loc BaseL = cast(Base); const MemRegion* BaseR = 0; switch (BaseL.getSubKind()) { case loc::MemRegionKind: BaseR = cast(BaseL).getRegion(); break; case loc::GotoLabelKind: // These are anormal cases. Flag an undefined value. return UndefinedVal(); case loc::ConcreteIntKind: // While these seem funny, this can happen through casts. // FIXME: What we should return is the field offset. For example, // add the field offset to the integer value. That way funny things // like this work properly: &(((struct foo *) 0xa)->f) return Base; default: assert(0 && "Unhandled Base."); return Base; } // NOTE: We must have this check first because ObjCIvarDecl is a subclass // of FieldDecl. if (const ObjCIvarDecl *ID = dyn_cast(D)) return loc::MemRegionVal(MRMgr.getObjCIvarRegion(ID, BaseR)); return loc::MemRegionVal(MRMgr.getFieldRegion(cast(D), BaseR)); } SVal RegionStoreManager::getLValueElement(const GRState *St, QualType elementType, SVal Base, SVal Offset) { // If the base is an unknown or undefined value, just return it back. // FIXME: For absolute pointer addresses, we just return that value back as // well, although in reality we should return the offset added to that // value. if (Base.isUnknownOrUndef() || isa(Base)) return Base; // Only handle integer offsets... for now. if (!isa(Offset)) return UnknownVal(); const MemRegion* BaseRegion = cast(Base).getRegion(); // Pointer of any type can be cast and used as array base. const ElementRegion *ElemR = dyn_cast(BaseRegion); // Convert the offset to the appropriate size and signedness. Offset = ValMgr.convertToArrayIndex(Offset); if (!ElemR) { // // If the base region is not an ElementRegion, create one. // This can happen in the following example: // // char *p = __builtin_alloc(10); // p[1] = 8; // // Observe that 'p' binds to an AllocaRegion. // return loc::MemRegionVal(MRMgr.getElementRegion(elementType, Offset, BaseRegion, getContext())); } SVal BaseIdx = ElemR->getIndex(); if (!isa(BaseIdx)) return UnknownVal(); const llvm::APSInt& BaseIdxI = cast(BaseIdx).getValue(); const llvm::APSInt& OffI = cast(Offset).getValue(); assert(BaseIdxI.isSigned()); // Compute the new index. SVal NewIdx = nonloc::ConcreteInt(getBasicVals().getValue(BaseIdxI + OffI)); // Construct the new ElementRegion. const MemRegion *ArrayR = ElemR->getSuperRegion(); return loc::MemRegionVal(MRMgr.getElementRegion(elementType, NewIdx, ArrayR, getContext())); } //===----------------------------------------------------------------------===// // Extents for regions. //===----------------------------------------------------------------------===// SVal RegionStoreManager::getSizeInElements(const GRState *state, const MemRegion *R) { switch (R->getKind()) { case MemRegion::MemSpaceRegionKind: assert(0 && "Cannot index into a MemSpace"); return UnknownVal(); case MemRegion::CodeTextRegionKind: // Technically this can happen if people do funny things with casts. return UnknownVal(); // Not yet handled. case MemRegion::AllocaRegionKind: case MemRegion::CompoundLiteralRegionKind: case MemRegion::ElementRegionKind: case MemRegion::FieldRegionKind: case MemRegion::ObjCIvarRegionKind: case MemRegion::ObjCObjectRegionKind: case MemRegion::SymbolicRegionKind: return UnknownVal(); case MemRegion::StringRegionKind: { const StringLiteral* Str = cast(R)->getStringLiteral(); // We intentionally made the size value signed because it participates in // operations with signed indices. return ValMgr.makeIntVal(Str->getByteLength()+1, false); } case MemRegion::VarRegionKind: { const VarRegion* VR = cast(R); // Get the type of the variable. QualType T = VR->getDesugaredValueType(getContext()); // FIXME: Handle variable-length arrays. if (isa(T)) return UnknownVal(); if (const ConstantArrayType* CAT = dyn_cast(T)) { // return the size as signed integer. return ValMgr.makeIntVal(CAT->getSize(), false); } // Clients can use ordinary variables as if they were arrays. These // essentially are arrays of size 1. return ValMgr.makeIntVal(1, false); } case MemRegion::BEG_DECL_REGIONS: case MemRegion::END_DECL_REGIONS: case MemRegion::BEG_TYPED_REGIONS: case MemRegion::END_TYPED_REGIONS: assert(0 && "Infeasible region"); return UnknownVal(); } assert(0 && "Unreachable"); return UnknownVal(); } const GRState *RegionStoreManager::setExtent(const GRState *state, const MemRegion *region, SVal extent) { return state->set(region, extent); } //===----------------------------------------------------------------------===// // Location and region casting. //===----------------------------------------------------------------------===// /// ArrayToPointer - Emulates the "decay" of an array to a pointer /// type. 'Array' represents the lvalue of the array being decayed /// to a pointer, and the returned SVal represents the decayed /// version of that lvalue (i.e., a pointer to the first element of /// the array). This is called by GRExprEngine when evaluating casts /// from arrays to pointers. SVal RegionStoreManager::ArrayToPointer(Loc Array) { if (!isa(Array)) return UnknownVal(); const MemRegion* R = cast(&Array)->getRegion(); const TypedRegion* ArrayR = dyn_cast(R); if (!ArrayR) return UnknownVal(); // Strip off typedefs from the ArrayRegion's ValueType. QualType T = ArrayR->getValueType(getContext())->getDesugaredType(); ArrayType *AT = cast(T); T = AT->getElementType(); SVal ZeroIdx = ValMgr.makeZeroArrayIndex(); ElementRegion* ER = MRMgr.getElementRegion(T, ZeroIdx, ArrayR, getContext()); return loc::MemRegionVal(ER); } //===----------------------------------------------------------------------===// // Pointer arithmetic. //===----------------------------------------------------------------------===// SVal RegionStoreManager::EvalBinOp(const GRState *state, BinaryOperator::Opcode Op, Loc L, NonLoc R, QualType resultTy) { // Assume the base location is MemRegionVal. if (!isa(L)) return UnknownVal(); const MemRegion* MR = cast(L).getRegion(); const ElementRegion *ER = 0; switch (MR->getKind()) { case MemRegion::SymbolicRegionKind: { const SymbolicRegion *SR = cast(MR); SymbolRef Sym = SR->getSymbol(); QualType T = Sym->getType(getContext()); QualType EleTy = T->getAs()->getPointeeType(); SVal ZeroIdx = ValMgr.makeZeroArrayIndex(); ER = MRMgr.getElementRegion(EleTy, ZeroIdx, SR, getContext()); break; } case MemRegion::AllocaRegionKind: { const AllocaRegion *AR = cast(MR); QualType T = getContext().CharTy; // Create an ElementRegion of bytes. QualType EleTy = T->getAs()->getPointeeType(); SVal ZeroIdx = ValMgr.makeZeroArrayIndex(); ER = MRMgr.getElementRegion(EleTy, ZeroIdx, AR, getContext()); break; } case MemRegion::ElementRegionKind: { ER = cast(MR); break; } // Not yet handled. case MemRegion::VarRegionKind: case MemRegion::StringRegionKind: case MemRegion::CompoundLiteralRegionKind: case MemRegion::FieldRegionKind: case MemRegion::ObjCObjectRegionKind: case MemRegion::ObjCIvarRegionKind: return UnknownVal(); case MemRegion::CodeTextRegionKind: // Technically this can happen if people do funny things with casts. return UnknownVal(); case MemRegion::MemSpaceRegionKind: assert(0 && "Cannot perform pointer arithmetic on a MemSpace"); return UnknownVal(); case MemRegion::BEG_DECL_REGIONS: case MemRegion::END_DECL_REGIONS: case MemRegion::BEG_TYPED_REGIONS: case MemRegion::END_TYPED_REGIONS: assert(0 && "Infeasible region"); return UnknownVal(); } SVal Idx = ER->getIndex(); nonloc::ConcreteInt* Base = dyn_cast(&Idx); nonloc::ConcreteInt* Offset = dyn_cast(&R); // Only support concrete integer indexes for now. if (Base && Offset) { // FIXME: Should use SValuator here. SVal NewIdx = Base->evalBinOp(ValMgr, Op, cast(ValMgr.convertToArrayIndex(*Offset))); const MemRegion* NewER = MRMgr.getElementRegion(ER->getElementType(), NewIdx, ER->getSuperRegion(), getContext()); return ValMgr.makeLoc(NewER); } return UnknownVal(); } //===----------------------------------------------------------------------===// // Loading values from regions. //===----------------------------------------------------------------------===// Optional RegionStoreManager::getDefaultBinding(const GRState *state, const MemRegion *R) { if (R->isBoundable()) if (const TypedRegion *TR = dyn_cast(R)) if (TR->getValueType(getContext())->isUnionType()) return UnknownVal(); return Optional::create(state->get(R)); } static bool IsReinterpreted(QualType RTy, QualType UsedTy, ASTContext &Ctx) { RTy = Ctx.getCanonicalType(RTy); UsedTy = Ctx.getCanonicalType(UsedTy); if (RTy == UsedTy) return false; // Recursively check the types. We basically want to see if a pointer value // is ever reinterpreted as a non-pointer, e.g. void** and intptr_t* // represents a reinterpretation. if (Loc::IsLocType(RTy) && Loc::IsLocType(UsedTy)) { const PointerType *PRTy = RTy->getAs(); const PointerType *PUsedTy = UsedTy->getAs(); return PUsedTy && PRTy && IsReinterpreted(PRTy->getPointeeType(), PUsedTy->getPointeeType(), Ctx); } return true; } SValuator::CastResult RegionStoreManager::Retrieve(const GRState *state, Loc L, QualType T) { assert(!isa(L) && "location unknown"); assert(!isa(L) && "location undefined"); // FIXME: Is this even possible? Shouldn't this be treated as a null // dereference at a higher level? if (isa(L)) return SValuator::CastResult(state, UndefinedVal()); const MemRegion *MR = cast(L).getRegion(); // FIXME: return symbolic value for these cases. // Example: // void f(int* p) { int x = *p; } // char* p = alloca(); // read(p); // c = *p; if (isa(MR)) return SValuator::CastResult(state, UnknownVal()); if (isa(MR)) { ASTContext &Ctx = getContext(); SVal idx = ValMgr.makeZeroArrayIndex(); assert(!T.isNull()); MR = MRMgr.getElementRegion(T, idx, MR, Ctx); } if (isa(MR)) return SValuator::CastResult(state, UnknownVal()); // FIXME: Perhaps this method should just take a 'const MemRegion*' argument // instead of 'Loc', and have the other Loc cases handled at a higher level. const TypedRegion *R = cast(MR); QualType RTy = R->getValueType(getContext()); // FIXME: We should eventually handle funny addressing. e.g.: // // int x = ...; // int *p = &x; // char *q = (char*) p; // char c = *q; // returns the first byte of 'x'. // // Such funny addressing will occur due to layering of regions. #if 0 ASTContext &Ctx = getContext(); if (!T.isNull() && IsReinterpreted(RTy, T, Ctx)) { SVal ZeroIdx = ValMgr.makeZeroArrayIndex(); R = MRMgr.getElementRegion(T, ZeroIdx, R, Ctx); RTy = T; assert(Ctx.getCanonicalType(RTy) == Ctx.getCanonicalType(R->getValueType(Ctx))); } #endif if (RTy->isStructureType()) return SValuator::CastResult(state, RetrieveStruct(state, R)); // FIXME: Handle unions. if (RTy->isUnionType()) return SValuator::CastResult(state, UnknownVal()); if (RTy->isArrayType()) return SValuator::CastResult(state, RetrieveArray(state, R)); // FIXME: handle Vector types. if (RTy->isVectorType()) return SValuator::CastResult(state, UnknownVal()); if (const FieldRegion* FR = dyn_cast(R)) return CastRetrievedVal(RetrieveField(state, FR), state, FR, T); if (const ElementRegion* ER = dyn_cast(R)) return CastRetrievedVal(RetrieveElement(state, ER), state, ER, T); if (const ObjCIvarRegion *IVR = dyn_cast(R)) return CastRetrievedVal(RetrieveObjCIvar(state, IVR), state, IVR, T); if (const VarRegion *VR = dyn_cast(R)) return CastRetrievedVal(RetrieveVar(state, VR), state, VR, T); RegionBindings B = GetRegionBindings(state->getStore()); RegionBindings::data_type* V = B.lookup(R); // Check if the region has a binding. if (V) return SValuator::CastResult(state, *V); // The location does not have a bound value. This means that it has // the value it had upon its creation and/or entry to the analyzed // function/method. These are either symbolic values or 'undefined'. #if HEAP_UNDEFINED if (R->hasHeapOrStackStorage()) { #else if (R->hasStackStorage()) { #endif // All stack variables are considered to have undefined values // upon creation. All heap allocated blocks are considered to // have undefined values as well unless they are explicitly bound // to specific values. return SValuator::CastResult(state, UndefinedVal()); } // All other values are symbolic. return SValuator::CastResult(state, ValMgr.getRegionValueSymbolValOrUnknown(R, RTy)); } std::pair RegionStoreManager::GetLazyBinding(RegionBindings B, const MemRegion *R) { if (const nonloc::LazyCompoundVal *V = dyn_cast_or_null(B.lookup(R))) return std::make_pair(V->getState(), V->getRegion()); if (const ElementRegion *ER = dyn_cast(R)) { const std::pair &X = GetLazyBinding(B, ER->getSuperRegion()); if (X.first) return std::make_pair(X.first, MRMgr.getElementRegionWithSuper(ER, X.second)); } else if (const FieldRegion *FR = dyn_cast(R)) { const std::pair &X = GetLazyBinding(B, FR->getSuperRegion()); if (X.first) return std::make_pair(X.first, MRMgr.getFieldRegionWithSuper(FR, X.second)); } return std::make_pair((const GRState*) 0, (const MemRegion *) 0); } SVal RegionStoreManager::RetrieveElement(const GRState* state, const ElementRegion* R) { // Check if the region has a binding. RegionBindings B = GetRegionBindings(state->getStore()); if (const SVal* V = B.lookup(R)) return *V; const MemRegion* superR = R->getSuperRegion(); // Check if the region is an element region of a string literal. if (const StringRegion *StrR=dyn_cast(superR)) { const StringLiteral *Str = StrR->getStringLiteral(); SVal Idx = R->getIndex(); if (nonloc::ConcreteInt *CI = dyn_cast(&Idx)) { int64_t i = CI->getValue().getSExtValue(); char c; if (i == Str->getByteLength()) c = '\0'; else c = Str->getStrData()[i]; return ValMgr.makeIntVal(c, getContext().CharTy); } } // Special case: the current region represents a cast and it and the super // region both have pointer types or intptr_t types. If so, perform the // retrieve from the super region and appropriately "cast" the value. // This is needed to support OSAtomicCompareAndSwap and friends or other // loads that treat integers as pointers and vis versa. if (R->getIndex().isZeroConstant()) { if (const TypedRegion *superTR = dyn_cast(superR)) { ASTContext &Ctx = getContext(); if (IsAnyPointerOrIntptr(superTR->getValueType(Ctx), Ctx)) { QualType valTy = R->getValueType(Ctx); if (IsAnyPointerOrIntptr(valTy, Ctx)) { // Retrieve the value from the super region. This will be casted to // valTy when we return to 'Retrieve'. const SValuator::CastResult &cr = Retrieve(state, loc::MemRegionVal(superR), valTy); return cr.getSVal(); } } } } // Check if the immediate super region has a direct binding. if (const SVal *V = B.lookup(superR)) { if (SymbolRef parentSym = V->getAsSymbol()) return ValMgr.getDerivedRegionValueSymbolVal(parentSym, R); if (V->isUnknownOrUndef()) return *V; // Handle LazyCompoundVals for the immediate super region. Other cases // are handled in 'RetrieveFieldOrElementCommon'. if (const nonloc::LazyCompoundVal *LCV = dyn_cast(V)) { R = MRMgr.getElementRegionWithSuper(R, LCV->getRegion()); return RetrieveElement(LCV->getState(), R); } // Other cases: give up. return UnknownVal(); } return RetrieveFieldOrElementCommon(state, R, R->getElementType(), superR); } SVal RegionStoreManager::RetrieveField(const GRState* state, const FieldRegion* R) { // Check if the region has a binding. RegionBindings B = GetRegionBindings(state->getStore()); if (const SVal* V = B.lookup(R)) return *V; QualType Ty = R->getValueType(getContext()); return RetrieveFieldOrElementCommon(state, R, Ty, R->getSuperRegion()); } SVal RegionStoreManager::RetrieveFieldOrElementCommon(const GRState *state, const TypedRegion *R, QualType Ty, const MemRegion *superR) { // At this point we have already checked in either RetrieveElement or // RetrieveField if 'R' has a direct binding. RegionBindings B = GetRegionBindings(state->getStore()); while (superR) { if (const Optional &D = getDefaultBinding(state, superR)) { if (SymbolRef parentSym = D->getAsSymbol()) return ValMgr.getDerivedRegionValueSymbolVal(parentSym, R); if (D->isZeroConstant()) return ValMgr.makeZeroVal(Ty); if (D->isUnknown()) return *D; assert(0 && "Unknown default value"); } // If our super region is a field or element itself, walk up the region // hierarchy to see if there is a default value installed in an ancestor. if (isa(superR) || isa(superR)) { superR = cast(superR)->getSuperRegion(); continue; } break; } // Lazy binding? const GRState *lazyBindingState = NULL; const MemRegion *lazyBindingRegion = NULL; llvm::tie(lazyBindingState, lazyBindingRegion) = GetLazyBinding(B, R); if (lazyBindingState) { assert(lazyBindingRegion && "Lazy-binding region not set"); if (isa(R)) return RetrieveElement(lazyBindingState, cast(lazyBindingRegion)); return RetrieveField(lazyBindingState, cast(lazyBindingRegion)); } if (R->hasStackStorage() && !R->hasParametersStorage()) { if (isa(R)) { // Currently we don't reason specially about Clang-style vectors. Check // if superR is a vector and if so return Unknown. if (const TypedRegion *typedSuperR = dyn_cast(superR)) { if (typedSuperR->getValueType(getContext())->isVectorType()) return UnknownVal(); } } return UndefinedVal(); } // All other values are symbolic. return ValMgr.getRegionValueSymbolValOrUnknown(R, Ty); } SVal RegionStoreManager::RetrieveObjCIvar(const GRState* state, const ObjCIvarRegion* R) { // Check if the region has a binding. RegionBindings B = GetRegionBindings(state->getStore()); if (const SVal* V = B.lookup(R)) return *V; const MemRegion *superR = R->getSuperRegion(); // Check if the super region has a binding. if (const SVal *V = B.lookup(superR)) { if (SymbolRef parentSym = V->getAsSymbol()) return ValMgr.getDerivedRegionValueSymbolVal(parentSym, R); // Other cases: give up. return UnknownVal(); } return RetrieveLazySymbol(state, R); } SVal RegionStoreManager::RetrieveVar(const GRState *state, const VarRegion *R) { // Check if the region has a binding. RegionBindings B = GetRegionBindings(state->getStore()); if (const SVal* V = B.lookup(R)) return *V; // Lazily derive a value for the VarRegion. const VarDecl *VD = R->getDecl(); if (R->hasGlobalsOrParametersStorage()) return ValMgr.getRegionValueSymbolValOrUnknown(R, VD->getType()); return UndefinedVal(); } SVal RegionStoreManager::RetrieveLazySymbol(const GRState *state, const TypedRegion *R) { QualType valTy = R->getValueType(getContext()); // All other values are symbolic. return ValMgr.getRegionValueSymbolValOrUnknown(R, valTy); } SVal RegionStoreManager::RetrieveStruct(const GRState *state, const TypedRegion* R){ QualType T = R->getValueType(getContext()); assert(T->isStructureType()); const RecordType* RT = T->getAsStructureType(); RecordDecl* RD = RT->getDecl(); assert(RD->isDefinition()); (void)RD; #if USE_EXPLICIT_COMPOUND llvm::ImmutableList StructVal = getBasicVals().getEmptySValList(); // FIXME: We shouldn't use a std::vector. If RecordDecl doesn't have a // reverse iterator, we should implement one. std::vector Fields(RD->field_begin(), RD->field_end()); for (std::vector::reverse_iterator Field = Fields.rbegin(), FieldEnd = Fields.rend(); Field != FieldEnd; ++Field) { FieldRegion* FR = MRMgr.getFieldRegion(*Field, R); QualType FTy = (*Field)->getType(); SVal FieldValue = Retrieve(state, loc::MemRegionVal(FR), FTy).getSVal(); StructVal = getBasicVals().consVals(FieldValue, StructVal); } return ValMgr.makeCompoundVal(T, StructVal); #else return ValMgr.makeLazyCompoundVal(state, R); #endif } SVal RegionStoreManager::RetrieveArray(const GRState *state, const TypedRegion * R) { #if USE_EXPLICIT_COMPOUND QualType T = R->getValueType(getContext()); ConstantArrayType* CAT = cast(T.getTypePtr()); llvm::ImmutableList ArrayVal = getBasicVals().getEmptySValList(); uint64_t size = CAT->getSize().getZExtValue(); for (uint64_t i = 0; i < size; ++i) { SVal Idx = ValMgr.makeArrayIndex(i); ElementRegion* ER = MRMgr.getElementRegion(CAT->getElementType(), Idx, R, getContext()); QualType ETy = ER->getElementType(); SVal ElementVal = Retrieve(state, loc::MemRegionVal(ER), ETy).getSVal(); ArrayVal = getBasicVals().consVals(ElementVal, ArrayVal); } return ValMgr.makeCompoundVal(T, ArrayVal); #else assert(isa(R->getValueType(getContext()))); return ValMgr.makeLazyCompoundVal(state, R); #endif } SValuator::CastResult RegionStoreManager::CastRetrievedVal(SVal V, const GRState *state, const TypedRegion *R, QualType castTy) { if (castTy.isNull()) return SValuator::CastResult(state, V); ASTContext &Ctx = getContext(); return ValMgr.getSValuator().EvalCast(V, state, castTy, R->getValueType(Ctx)); } //===----------------------------------------------------------------------===// // Binding values to regions. //===----------------------------------------------------------------------===// Store RegionStoreManager::Remove(Store store, Loc L) { const MemRegion* R = 0; if (isa(L)) R = cast(L).getRegion(); if (R) { RegionBindings B = GetRegionBindings(store); return RBFactory.Remove(B, R).getRoot(); } return store; } const GRState *RegionStoreManager::Bind(const GRState *state, Loc L, SVal V) { if (isa(L)) return state; // If we get here, the location should be a region. const MemRegion *R = cast(L).getRegion(); // Check if the region is a struct region. if (const TypedRegion* TR = dyn_cast(R)) if (TR->getValueType(getContext())->isStructureType()) return BindStruct(state, TR, V); // Special case: the current region represents a cast and it and the super // region both have pointer types or intptr_t types. If so, perform the // bind to the super region. // This is needed to support OSAtomicCompareAndSwap and friends or other // loads that treat integers as pointers and vis versa. if (const ElementRegion *ER = dyn_cast(R)) { if (ER->getIndex().isZeroConstant()) { if (const TypedRegion *superR = dyn_cast(ER->getSuperRegion())) { ASTContext &Ctx = getContext(); QualType superTy = superR->getValueType(Ctx); QualType erTy = ER->getValueType(Ctx); if (IsAnyPointerOrIntptr(superTy, Ctx) && IsAnyPointerOrIntptr(erTy, Ctx)) { SValuator::CastResult cr = ValMgr.getSValuator().EvalCast(V, state, superTy, erTy); return Bind(cr.getState(), loc::MemRegionVal(superR), cr.getSVal()); } } } } // Perform the binding. RegionBindings B = GetRegionBindings(state->getStore()); return state->makeWithStore(RBFactory.Add(B, R, V).getRoot()); } const GRState *RegionStoreManager::BindDecl(const GRState *ST, const VarDecl *VD, const LocationContext *LC, SVal InitVal) { QualType T = VD->getType(); VarRegion* VR = MRMgr.getVarRegion(VD, LC); if (T->isArrayType()) return BindArray(ST, VR, InitVal); if (T->isStructureType()) return BindStruct(ST, VR, InitVal); return Bind(ST, ValMgr.makeLoc(VR), InitVal); } // FIXME: this method should be merged into Bind(). const GRState * RegionStoreManager::BindCompoundLiteral(const GRState *state, const CompoundLiteralExpr* CL, SVal V) { CompoundLiteralRegion* R = MRMgr.getCompoundLiteralRegion(CL); return Bind(state, loc::MemRegionVal(R), V); } const GRState *RegionStoreManager::BindArray(const GRState *state, const TypedRegion* R, SVal Init) { QualType T = R->getValueType(getContext()); ConstantArrayType* CAT = cast(T.getTypePtr()); QualType ElementTy = CAT->getElementType(); uint64_t size = CAT->getSize().getZExtValue(); // Check if the init expr is a StringLiteral. if (isa(Init)) { const MemRegion* InitR = cast(Init).getRegion(); const StringLiteral* S = cast(InitR)->getStringLiteral(); const char* str = S->getStrData(); unsigned len = S->getByteLength(); unsigned j = 0; // Copy bytes from the string literal into the target array. Trailing bytes // in the array that are not covered by the string literal are initialized // to zero. for (uint64_t i = 0; i < size; ++i, ++j) { if (j >= len) break; SVal Idx = ValMgr.makeArrayIndex(i); ElementRegion* ER = MRMgr.getElementRegion(ElementTy, Idx, R, getContext()); SVal V = ValMgr.makeIntVal(str[j], sizeof(char)*8, true); state = Bind(state, loc::MemRegionVal(ER), V); } return state; } // Handle lazy compound values. if (nonloc::LazyCompoundVal *LCV = dyn_cast(&Init)) return CopyLazyBindings(*LCV, state, R); // Remaining case: explicit compound values. nonloc::CompoundVal& CV = cast(Init); nonloc::CompoundVal::iterator VI = CV.begin(), VE = CV.end(); uint64_t i = 0; for (; i < size; ++i, ++VI) { // The init list might be shorter than the array length. if (VI == VE) break; SVal Idx = ValMgr.makeArrayIndex(i); ElementRegion* ER = MRMgr.getElementRegion(ElementTy, Idx, R, getContext()); if (CAT->getElementType()->isStructureType()) state = BindStruct(state, ER, *VI); else state = Bind(state, ValMgr.makeLoc(ER), *VI); } // If the init list is shorter than the array length, set the array default // value. if (i < size) { if (ElementTy->isIntegerType()) { SVal V = ValMgr.makeZeroVal(ElementTy); state = setDefaultValue(state, R, V); } } return state; } const GRState * RegionStoreManager::BindStruct(const GRState *state, const TypedRegion* R, SVal V) { if (!Features.supportsFields()) return state; QualType T = R->getValueType(getContext()); assert(T->isStructureType()); const RecordType* RT = T->getAs(); RecordDecl* RD = RT->getDecl(); if (!RD->isDefinition()) return state; // Handle lazy compound values. if (const nonloc::LazyCompoundVal *LCV = dyn_cast(&V)) return CopyLazyBindings(*LCV, state, R); // We may get non-CompoundVal accidentally due to imprecise cast logic. // Ignore them and kill the field values. if (V.isUnknown() || !isa(V)) return KillStruct(state, R); nonloc::CompoundVal& CV = cast(V); nonloc::CompoundVal::iterator VI = CV.begin(), VE = CV.end(); RecordDecl::field_iterator FI, FE; for (FI = RD->field_begin(), FE = RD->field_end(); FI != FE; ++FI, ++VI) { if (VI == VE) break; QualType FTy = (*FI)->getType(); FieldRegion* FR = MRMgr.getFieldRegion(*FI, R); if (Loc::IsLocType(FTy) || FTy->isIntegerType()) state = Bind(state, ValMgr.makeLoc(FR), *VI); else if (FTy->isArrayType()) state = BindArray(state, FR, *VI); else if (FTy->isStructureType()) state = BindStruct(state, FR, *VI); } // There may be fewer values in the initialize list than the fields of struct. if (FI != FE) state = setDefaultValue(state, R, ValMgr.makeIntVal(0, false)); return state; } const GRState *RegionStoreManager::KillStruct(const GRState *state, const TypedRegion* R){ // Set the default value of the struct region to "unknown". state = state->set(R, UnknownVal()); // Remove all bindings for the subregions of the struct. Store store = state->getStore(); RegionBindings B = GetRegionBindings(store); for (RegionBindings::iterator I = B.begin(), E = B.end(); I != E; ++I) { const MemRegion* R = I.getKey(); if (const SubRegion* subRegion = dyn_cast(R)) if (subRegion->isSubRegionOf(R)) store = Remove(store, ValMgr.makeLoc(subRegion)); } return state->makeWithStore(store); } const GRState *RegionStoreManager::setDefaultValue(const GRState *state, const MemRegion* R, SVal V) { return state->set(R, V); } const GRState* RegionStoreManager::CopyLazyBindings(nonloc::LazyCompoundVal V, const GRState *state, const TypedRegion *R) { // Nuke the old bindings stemming from R. RegionBindings B = GetRegionBindings(state->getStore()); RegionDefaultBindings DVM = state->get(); RegionDefaultBindings::Factory &DVMFactory = state->get_context(); llvm::OwningPtr SubRegions(getRegionStoreSubRegionMap(state)); // B and DVM are updated after the call to RemoveSubRegionBindings. RemoveSubRegionBindings(B, DVM, DVMFactory, R, *SubRegions.get()); // Now copy the bindings. This amounts to just binding 'V' to 'R'. This // results in a zero-copy algorithm. return state->makeWithStore(RBFactory.Add(B, R, V).getRoot()); } //===----------------------------------------------------------------------===// // State pruning. //===----------------------------------------------------------------------===// static void UpdateLiveSymbols(SVal X, SymbolReaper& SymReaper) { if (loc::MemRegionVal *XR = dyn_cast(&X)) { const MemRegion *R = XR->getRegion(); while (R) { if (const SymbolicRegion *SR = dyn_cast(R)) { SymReaper.markLive(SR->getSymbol()); return; } if (const SubRegion *SR = dyn_cast(R)) { R = SR->getSuperRegion(); continue; } break; } return; } for (SVal::symbol_iterator SI=X.symbol_begin(), SE=X.symbol_end();SI!=SE;++SI) SymReaper.markLive(*SI); } namespace { class VISIBILITY_HIDDEN TreeScanner { RegionBindings B; RegionDefaultBindings DB; SymbolReaper &SymReaper; llvm::DenseSet &Marked; llvm::DenseSet &ScannedLazyVals; RegionStoreSubRegionMap &M; RegionStoreManager &RS; llvm::SmallVectorImpl &RegionRoots; const bool MarkKeys; public: TreeScanner(RegionBindings b, RegionDefaultBindings db, SymbolReaper &symReaper, llvm::DenseSet &marked, llvm::DenseSet &scannedLazyVals, RegionStoreSubRegionMap &m, RegionStoreManager &rs, llvm::SmallVectorImpl ®ionRoots, bool markKeys = true) : B(b), DB(db), SymReaper(symReaper), Marked(marked), ScannedLazyVals(scannedLazyVals), M(m), RS(rs), RegionRoots(regionRoots), MarkKeys(markKeys) {} void scanTree(const MemRegion *R); }; } // end anonymous namespace void TreeScanner::scanTree(const MemRegion *R) { if (MarkKeys) { if (Marked.count(R)) return; Marked.insert(R); } // Mark the symbol for any live SymbolicRegion as "live". This means we // should continue to track that symbol. if (const SymbolicRegion* SymR = dyn_cast(R)) SymReaper.markLive(SymR->getSymbol()); // Get the data binding for R (if any). const SVal* Xptr = B.lookup(R); // Check for lazy bindings. if (const nonloc::LazyCompoundVal *V = dyn_cast_or_null(Xptr)) { const LazyCompoundValData *D = V->getCVData(); if (!ScannedLazyVals.count(D)) { // Scan the bindings in the LazyCompoundVal. ScannedLazyVals.insert(D); // FIXME: Cache subregion maps. const GRState *lazyState = D->getState(); llvm::OwningPtr lazySM(RS.getRegionStoreSubRegionMap(lazyState)); Store lazyStore = lazyState->getStore(); RegionBindings lazyB = RS.GetRegionBindings(lazyStore); RegionDefaultBindings lazyDB = lazyState->get(); // Scan the bindings. TreeScanner scan(lazyB, lazyDB, SymReaper, Marked, ScannedLazyVals, *lazySM.get(), RS, RegionRoots, false); scan.scanTree(D->getRegion()); } } else { // No direct binding? Get the default binding for R (if any). if (!Xptr) Xptr = DB.lookup(R); // Direct or default binding? if (Xptr) { SVal X = *Xptr; UpdateLiveSymbols(X, SymReaper); // Update the set of live symbols. // If X is a region, then add it to the RegionRoots. if (const MemRegion *RX = X.getAsRegion()) { RegionRoots.push_back(RX); // Mark the super region of the RX as live. // e.g.: int x; char *y = (char*) &x; if (*y) ... // 'y' => element region. 'x' is its super region. if (const SubRegion *SR = dyn_cast(RX)) { RegionRoots.push_back(SR->getSuperRegion()); } } } } RegionStoreSubRegionMap::iterator I, E; for (llvm::tie(I, E) = M.begin_end(R); I != E; ++I) scanTree(*I); } void RegionStoreManager::RemoveDeadBindings(GRState &state, Stmt* Loc, SymbolReaper& SymReaper, llvm::SmallVectorImpl& RegionRoots) { Store store = state.getStore(); RegionBindings B = GetRegionBindings(store); // Lazily constructed backmap from MemRegions to SubRegions. typedef llvm::ImmutableSet SubRegionsTy; typedef llvm::ImmutableMap SubRegionsMapTy; // The backmap from regions to subregions. llvm::OwningPtr SubRegions(getRegionStoreSubRegionMap(&state)); // Do a pass over the regions in the store. For VarRegions we check if // the variable is still live and if so add it to the list of live roots. // For other regions we populate our region backmap. llvm::SmallVector IntermediateRoots; // Scan the direct bindings for "intermediate" roots. for (RegionBindings::iterator I = B.begin(), E = B.end(); I != E; ++I) { const MemRegion *R = I.getKey(); IntermediateRoots.push_back(R); } // Scan the default bindings for "intermediate" roots. RegionDefaultBindings DVM = state.get(); for (RegionDefaultBindings::iterator I = DVM.begin(), E = DVM.end(); I != E; ++I) { const MemRegion *R = I.getKey(); IntermediateRoots.push_back(R); } // Process the "intermediate" roots to find if they are referenced by // real roots. while (!IntermediateRoots.empty()) { const MemRegion* R = IntermediateRoots.back(); IntermediateRoots.pop_back(); if (const VarRegion* VR = dyn_cast(R)) { if (SymReaper.isLive(Loc, VR->getDecl())) { RegionRoots.push_back(VR); // This is a live "root". } continue; } if (const SymbolicRegion* SR = dyn_cast(R)) { if (SymReaper.isLive(SR->getSymbol())) RegionRoots.push_back(SR); continue; } // Add the super region for R to the worklist if it is a subregion. if (const SubRegion* superR = dyn_cast(cast(R)->getSuperRegion())) IntermediateRoots.push_back(superR); } // Process the worklist of RegionRoots. This performs a "mark-and-sweep" // of the store. We want to find all live symbols and dead regions. llvm::DenseSet Marked; llvm::DenseSet LazyVals; TreeScanner TS(B, DVM, SymReaper, Marked, LazyVals, *SubRegions.get(), *this, RegionRoots); while (!RegionRoots.empty()) { const MemRegion *R = RegionRoots.back(); RegionRoots.pop_back(); TS.scanTree(R); } // We have now scanned the store, marking reachable regions and symbols // as live. We now remove all the regions that are dead from the store // as well as update DSymbols with the set symbols that are now dead. for (RegionBindings::iterator I = B.begin(), E = B.end(); I != E; ++I) { const MemRegion* R = I.getKey(); // If this region live? Is so, none of its symbols are dead. if (Marked.count(R)) continue; // Remove this dead region from the store. store = Remove(store, ValMgr.makeLoc(R)); // Mark all non-live symbols that this region references as dead. if (const SymbolicRegion* SymR = dyn_cast(R)) SymReaper.maybeDead(SymR->getSymbol()); SVal X = I.getData(); SVal::symbol_iterator SI = X.symbol_begin(), SE = X.symbol_end(); for (; SI != SE; ++SI) SymReaper.maybeDead(*SI); } // Remove dead 'default' bindings. RegionDefaultBindings NewDVM = DVM; RegionDefaultBindings::Factory &DVMFactory = state.get_context(); for (RegionDefaultBindings::iterator I = DVM.begin(), E = DVM.end(); I != E; ++I) { const MemRegion *R = I.getKey(); // If this region live? Is so, none of its symbols are dead. if (Marked.count(R)) continue; // Remove this dead region. NewDVM = DVMFactory.Remove(NewDVM, R); // Mark all non-live symbols that this region references as dead. if (const SymbolicRegion* SymR = dyn_cast(R)) SymReaper.maybeDead(SymR->getSymbol()); SVal X = I.getData(); SVal::symbol_iterator SI = X.symbol_begin(), SE = X.symbol_end(); for (; SI != SE; ++SI) SymReaper.maybeDead(*SI); } // Write the store back. state.setStore(store); // Write the updated default bindings back. // FIXME: Right now this involves a fetching of a persistent state. // We can do better. if (DVM != NewDVM) state.setGDM(state.set(NewDVM)->getGDM()); } //===----------------------------------------------------------------------===// // Utility methods. //===----------------------------------------------------------------------===// void RegionStoreManager::print(Store store, llvm::raw_ostream& OS, const char* nl, const char *sep) { RegionBindings B = GetRegionBindings(store); OS << "Store (direct bindings):" << nl; for (RegionBindings::iterator I = B.begin(), E = B.end(); I != E; ++I) OS << ' ' << I.getKey() << " : " << I.getData() << nl; }