MallocChecker.cpp revision 919e8a1c6698bfa6848571d366430126bced727d
1//=== MallocChecker.cpp - A malloc/free checker -------------------*- C++ -*--//
2//
3//                     The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// This file defines malloc/free checker, which checks for potential memory
11// leaks, double free, and use-after-free problems.
12//
13//===----------------------------------------------------------------------===//
14
15#include "ClangSACheckers.h"
16#include "InterCheckerAPI.h"
17#include "clang/StaticAnalyzer/Core/Checker.h"
18#include "clang/StaticAnalyzer/Core/CheckerManager.h"
19#include "clang/StaticAnalyzer/Core/PathSensitive/CheckerContext.h"
20#include "clang/StaticAnalyzer/Core/BugReporter/BugType.h"
21#include "clang/StaticAnalyzer/Core/PathSensitive/CallEvent.h"
22#include "clang/StaticAnalyzer/Core/PathSensitive/ProgramState.h"
23#include "clang/StaticAnalyzer/Core/PathSensitive/ProgramStateTrait.h"
24#include "clang/StaticAnalyzer/Core/PathSensitive/SymbolManager.h"
25#include "clang/Basic/SourceManager.h"
26#include "llvm/ADT/ImmutableMap.h"
27#include "llvm/ADT/SmallString.h"
28#include "llvm/ADT/STLExtras.h"
29#include <climits>
30
31using namespace clang;
32using namespace ento;
33
34namespace {
35
36class RefState {
37  enum Kind { // Reference to allocated memory.
38              Allocated,
39              // Reference to released/freed memory.
40              Released,
41              // Reference to escaped memory - no assumptions can be made of
42              // the state after the reference escapes.
43              Escaped,
44              // The responsibility for freeing resources has transfered from
45              // this reference. A relinquished symbol should not be freed.
46              Relinquished } K;
47  const Stmt *S;
48
49public:
50  RefState(Kind k, const Stmt *s) : K(k), S(s) {}
51
52  bool isAllocated() const { return K == Allocated; }
53  bool isReleased() const { return K == Released; }
54  bool isRelinquished() const { return K == Relinquished; }
55
56  const Stmt *getStmt() const { return S; }
57
58  bool operator==(const RefState &X) const {
59    return K == X.K && S == X.S;
60  }
61
62  static RefState getAllocated(const Stmt *s) {
63    return RefState(Allocated, s);
64  }
65  static RefState getReleased(const Stmt *s) { return RefState(Released, s); }
66  static RefState getEscaped(const Stmt *s) { return RefState(Escaped, s); }
67  static RefState getRelinquished(const Stmt *s) {
68    return RefState(Relinquished, s);
69  }
70
71  void Profile(llvm::FoldingSetNodeID &ID) const {
72    ID.AddInteger(K);
73    ID.AddPointer(S);
74  }
75};
76
77struct ReallocPair {
78  SymbolRef ReallocatedSym;
79  bool IsFreeOnFailure;
80  ReallocPair(SymbolRef S, bool F) : ReallocatedSym(S), IsFreeOnFailure(F) {}
81  void Profile(llvm::FoldingSetNodeID &ID) const {
82    ID.AddInteger(IsFreeOnFailure);
83    ID.AddPointer(ReallocatedSym);
84  }
85  bool operator==(const ReallocPair &X) const {
86    return ReallocatedSym == X.ReallocatedSym &&
87           IsFreeOnFailure == X.IsFreeOnFailure;
88  }
89};
90
91typedef std::pair<const Stmt*, const MemRegion*> LeakInfo;
92
93class MallocChecker : public Checker<check::DeadSymbols,
94                                     check::EndPath,
95                                     check::PreStmt<ReturnStmt>,
96                                     check::PreStmt<CallExpr>,
97                                     check::PostStmt<CallExpr>,
98                                     check::PostStmt<BlockExpr>,
99                                     check::PreObjCMessage,
100                                     check::Location,
101                                     check::Bind,
102                                     eval::Assume,
103                                     check::RegionChanges>
104{
105  mutable OwningPtr<BugType> BT_DoubleFree;
106  mutable OwningPtr<BugType> BT_Leak;
107  mutable OwningPtr<BugType> BT_UseFree;
108  mutable OwningPtr<BugType> BT_BadFree;
109  mutable IdentifierInfo *II_malloc, *II_free, *II_realloc, *II_calloc,
110                         *II_valloc, *II_reallocf, *II_strndup, *II_strdup;
111
112public:
113  MallocChecker() : II_malloc(0), II_free(0), II_realloc(0), II_calloc(0),
114                    II_valloc(0), II_reallocf(0), II_strndup(0), II_strdup(0) {}
115
116  /// In pessimistic mode, the checker assumes that it does not know which
117  /// functions might free the memory.
118  struct ChecksFilter {
119    DefaultBool CMallocPessimistic;
120    DefaultBool CMallocOptimistic;
121  };
122
123  ChecksFilter Filter;
124
125  void checkPreStmt(const CallExpr *S, CheckerContext &C) const;
126  void checkPostStmt(const CallExpr *CE, CheckerContext &C) const;
127  void checkPreObjCMessage(const ObjCMethodCall &Call, CheckerContext &C) const;
128  void checkPostStmt(const BlockExpr *BE, CheckerContext &C) const;
129  void checkDeadSymbols(SymbolReaper &SymReaper, CheckerContext &C) const;
130  void checkEndPath(CheckerContext &C) const;
131  void checkPreStmt(const ReturnStmt *S, CheckerContext &C) const;
132  ProgramStateRef evalAssume(ProgramStateRef state, SVal Cond,
133                            bool Assumption) const;
134  void checkLocation(SVal l, bool isLoad, const Stmt *S,
135                     CheckerContext &C) const;
136  void checkBind(SVal location, SVal val, const Stmt*S,
137                 CheckerContext &C) const;
138  ProgramStateRef
139  checkRegionChanges(ProgramStateRef state,
140                     const StoreManager::InvalidatedSymbols *invalidated,
141                     ArrayRef<const MemRegion *> ExplicitRegions,
142                     ArrayRef<const MemRegion *> Regions,
143                     const CallEvent *Call) const;
144  bool wantsRegionChangeUpdate(ProgramStateRef state) const {
145    return true;
146  }
147
148  void printState(raw_ostream &Out, ProgramStateRef State,
149                  const char *NL, const char *Sep) const;
150
151private:
152  void initIdentifierInfo(ASTContext &C) const;
153
154  /// Check if this is one of the functions which can allocate/reallocate memory
155  /// pointed to by one of its arguments.
156  bool isMemFunction(const FunctionDecl *FD, ASTContext &C) const;
157  bool isFreeFunction(const FunctionDecl *FD, ASTContext &C) const;
158  bool isAllocationFunction(const FunctionDecl *FD, ASTContext &C) const;
159
160  static ProgramStateRef MallocMemReturnsAttr(CheckerContext &C,
161                                              const CallExpr *CE,
162                                              const OwnershipAttr* Att);
163  static ProgramStateRef MallocMemAux(CheckerContext &C, const CallExpr *CE,
164                                     const Expr *SizeEx, SVal Init,
165                                     ProgramStateRef state) {
166    return MallocMemAux(C, CE,
167                        state->getSVal(SizeEx, C.getLocationContext()),
168                        Init, state);
169  }
170
171  static ProgramStateRef MallocMemAux(CheckerContext &C, const CallExpr *CE,
172                                     SVal SizeEx, SVal Init,
173                                     ProgramStateRef state);
174
175  /// Update the RefState to reflect the new memory allocation.
176  static ProgramStateRef MallocUpdateRefState(CheckerContext &C,
177                                              const CallExpr *CE,
178                                              ProgramStateRef state);
179
180  ProgramStateRef FreeMemAttr(CheckerContext &C, const CallExpr *CE,
181                              const OwnershipAttr* Att) const;
182  ProgramStateRef FreeMemAux(CheckerContext &C, const CallExpr *CE,
183                             ProgramStateRef state, unsigned Num,
184                             bool Hold) const;
185  ProgramStateRef FreeMemAux(CheckerContext &C, const Expr *Arg,
186                             const Expr *ParentExpr,
187                             ProgramStateRef state,
188                             bool Hold) const;
189
190  ProgramStateRef ReallocMem(CheckerContext &C, const CallExpr *CE,
191                             bool FreesMemOnFailure) const;
192  static ProgramStateRef CallocMem(CheckerContext &C, const CallExpr *CE);
193
194  ///\brief Check if the memory associated with this symbol was released.
195  bool isReleased(SymbolRef Sym, CheckerContext &C) const;
196
197  bool checkEscape(SymbolRef Sym, const Stmt *S, CheckerContext &C) const;
198  bool checkUseAfterFree(SymbolRef Sym, CheckerContext &C,
199                         const Stmt *S = 0) const;
200
201  /// Check if the function is not known to us. So, for example, we could
202  /// conservatively assume it can free/reallocate it's pointer arguments.
203  bool doesNotFreeMemory(const CallEvent *Call,
204                         ProgramStateRef State) const;
205
206  static bool SummarizeValue(raw_ostream &os, SVal V);
207  static bool SummarizeRegion(raw_ostream &os, const MemRegion *MR);
208  void ReportBadFree(CheckerContext &C, SVal ArgVal, SourceRange range) const;
209
210  /// Find the location of the allocation for Sym on the path leading to the
211  /// exploded node N.
212  LeakInfo getAllocationSite(const ExplodedNode *N, SymbolRef Sym,
213                             CheckerContext &C) const;
214
215  void reportLeak(SymbolRef Sym, ExplodedNode *N, CheckerContext &C) const;
216
217  /// The bug visitor which allows us to print extra diagnostics along the
218  /// BugReport path. For example, showing the allocation site of the leaked
219  /// region.
220  class MallocBugVisitor : public BugReporterVisitorImpl<MallocBugVisitor> {
221  protected:
222    enum NotificationMode {
223      Normal,
224      ReallocationFailed
225    };
226
227    // The allocated region symbol tracked by the main analysis.
228    SymbolRef Sym;
229
230    // The mode we are in, i.e. what kind of diagnostics will be emitted.
231    NotificationMode Mode;
232
233    // A symbol from when the primary region should have been reallocated.
234    SymbolRef FailedReallocSymbol;
235
236    bool IsLeak;
237
238  public:
239    MallocBugVisitor(SymbolRef S, bool isLeak = false)
240       : Sym(S), Mode(Normal), FailedReallocSymbol(0), IsLeak(isLeak) {}
241
242    virtual ~MallocBugVisitor() {}
243
244    void Profile(llvm::FoldingSetNodeID &ID) const {
245      static int X = 0;
246      ID.AddPointer(&X);
247      ID.AddPointer(Sym);
248    }
249
250    inline bool isAllocated(const RefState *S, const RefState *SPrev,
251                            const Stmt *Stmt) {
252      // Did not track -> allocated. Other state (released) -> allocated.
253      return (Stmt && isa<CallExpr>(Stmt) &&
254              (S && S->isAllocated()) && (!SPrev || !SPrev->isAllocated()));
255    }
256
257    inline bool isReleased(const RefState *S, const RefState *SPrev,
258                           const Stmt *Stmt) {
259      // Did not track -> released. Other state (allocated) -> released.
260      return (Stmt && isa<CallExpr>(Stmt) &&
261              (S && S->isReleased()) && (!SPrev || !SPrev->isReleased()));
262    }
263
264    inline bool isRelinquished(const RefState *S, const RefState *SPrev,
265                               const Stmt *Stmt) {
266      // Did not track -> relinquished. Other state (allocated) -> relinquished.
267      return (Stmt && (isa<CallExpr>(Stmt) || isa<ObjCMessageExpr>(Stmt) ||
268                                              isa<ObjCPropertyRefExpr>(Stmt)) &&
269              (S && S->isRelinquished()) &&
270              (!SPrev || !SPrev->isRelinquished()));
271    }
272
273    inline bool isReallocFailedCheck(const RefState *S, const RefState *SPrev,
274                                     const Stmt *Stmt) {
275      // If the expression is not a call, and the state change is
276      // released -> allocated, it must be the realloc return value
277      // check. If we have to handle more cases here, it might be cleaner just
278      // to track this extra bit in the state itself.
279      return ((!Stmt || !isa<CallExpr>(Stmt)) &&
280              (S && S->isAllocated()) && (SPrev && !SPrev->isAllocated()));
281    }
282
283    PathDiagnosticPiece *VisitNode(const ExplodedNode *N,
284                                   const ExplodedNode *PrevN,
285                                   BugReporterContext &BRC,
286                                   BugReport &BR);
287
288    PathDiagnosticPiece* getEndPath(BugReporterContext &BRC,
289                                    const ExplodedNode *EndPathNode,
290                                    BugReport &BR) {
291      if (!IsLeak)
292        return 0;
293
294      PathDiagnosticLocation L =
295        PathDiagnosticLocation::createEndOfPath(EndPathNode,
296                                                BRC.getSourceManager());
297      // Do not add the statement itself as a range in case of leak.
298      return new PathDiagnosticEventPiece(L, BR.getDescription(), false);
299    }
300
301  private:
302    class StackHintGeneratorForReallocationFailed
303        : public StackHintGeneratorForSymbol {
304    public:
305      StackHintGeneratorForReallocationFailed(SymbolRef S, StringRef M)
306        : StackHintGeneratorForSymbol(S, M) {}
307
308      virtual std::string getMessageForArg(const Expr *ArgE, unsigned ArgIndex) {
309        SmallString<200> buf;
310        llvm::raw_svector_ostream os(buf);
311
312        os << "Reallocation of ";
313        // Printed parameters start at 1, not 0.
314        printOrdinal(++ArgIndex, os);
315        os << " parameter failed";
316
317        return os.str();
318      }
319
320      virtual std::string getMessageForReturn(const CallExpr *CallExpr) {
321        return "Reallocation of returned value failed";
322      }
323    };
324  };
325};
326} // end anonymous namespace
327
328typedef llvm::ImmutableMap<SymbolRef, RefState> RegionStateTy;
329typedef llvm::ImmutableMap<SymbolRef, ReallocPair > ReallocMap;
330class RegionState {};
331class ReallocPairs {};
332namespace clang {
333namespace ento {
334  template <>
335  struct ProgramStateTrait<RegionState>
336    : public ProgramStatePartialTrait<RegionStateTy> {
337    static void *GDMIndex() { static int x; return &x; }
338  };
339
340  template <>
341  struct ProgramStateTrait<ReallocPairs>
342    : public ProgramStatePartialTrait<ReallocMap> {
343    static void *GDMIndex() { static int x; return &x; }
344  };
345}
346}
347
348namespace {
349class StopTrackingCallback : public SymbolVisitor {
350  ProgramStateRef state;
351public:
352  StopTrackingCallback(ProgramStateRef st) : state(st) {}
353  ProgramStateRef getState() const { return state; }
354
355  bool VisitSymbol(SymbolRef sym) {
356    state = state->remove<RegionState>(sym);
357    return true;
358  }
359};
360} // end anonymous namespace
361
362void MallocChecker::initIdentifierInfo(ASTContext &Ctx) const {
363  if (II_malloc)
364    return;
365  II_malloc = &Ctx.Idents.get("malloc");
366  II_free = &Ctx.Idents.get("free");
367  II_realloc = &Ctx.Idents.get("realloc");
368  II_reallocf = &Ctx.Idents.get("reallocf");
369  II_calloc = &Ctx.Idents.get("calloc");
370  II_valloc = &Ctx.Idents.get("valloc");
371  II_strdup = &Ctx.Idents.get("strdup");
372  II_strndup = &Ctx.Idents.get("strndup");
373}
374
375bool MallocChecker::isMemFunction(const FunctionDecl *FD, ASTContext &C) const {
376  if (isFreeFunction(FD, C))
377    return true;
378
379  if (isAllocationFunction(FD, C))
380    return true;
381
382  return false;
383}
384
385bool MallocChecker::isAllocationFunction(const FunctionDecl *FD,
386                                         ASTContext &C) const {
387  if (!FD)
388    return false;
389
390  if (FD->getKind() == Decl::Function) {
391    IdentifierInfo *FunI = FD->getIdentifier();
392    initIdentifierInfo(C);
393
394    if (FunI == II_malloc || FunI == II_realloc ||
395        FunI == II_reallocf || FunI == II_calloc || FunI == II_valloc ||
396        FunI == II_strdup || FunI == II_strndup)
397      return true;
398  }
399
400  if (Filter.CMallocOptimistic && FD->hasAttrs())
401    for (specific_attr_iterator<OwnershipAttr>
402           i = FD->specific_attr_begin<OwnershipAttr>(),
403           e = FD->specific_attr_end<OwnershipAttr>();
404           i != e; ++i)
405      if ((*i)->getOwnKind() == OwnershipAttr::Returns)
406        return true;
407  return false;
408}
409
410bool MallocChecker::isFreeFunction(const FunctionDecl *FD, ASTContext &C) const {
411  if (!FD)
412    return false;
413
414  if (FD->getKind() == Decl::Function) {
415    IdentifierInfo *FunI = FD->getIdentifier();
416    initIdentifierInfo(C);
417
418    if (FunI == II_free || FunI == II_realloc || FunI == II_reallocf)
419      return true;
420  }
421
422  if (Filter.CMallocOptimistic && FD->hasAttrs())
423    for (specific_attr_iterator<OwnershipAttr>
424           i = FD->specific_attr_begin<OwnershipAttr>(),
425           e = FD->specific_attr_end<OwnershipAttr>();
426           i != e; ++i)
427      if ((*i)->getOwnKind() == OwnershipAttr::Takes ||
428          (*i)->getOwnKind() == OwnershipAttr::Holds)
429        return true;
430  return false;
431}
432
433void MallocChecker::checkPostStmt(const CallExpr *CE, CheckerContext &C) const {
434  const FunctionDecl *FD = C.getCalleeDecl(CE);
435  if (!FD)
436    return;
437
438  ProgramStateRef State = C.getState();
439
440  if (FD->getKind() == Decl::Function) {
441    initIdentifierInfo(C.getASTContext());
442    IdentifierInfo *FunI = FD->getIdentifier();
443
444    if (FunI == II_malloc || FunI == II_valloc) {
445      if (CE->getNumArgs() < 1)
446        return;
447      State = MallocMemAux(C, CE, CE->getArg(0), UndefinedVal(), State);
448    } else if (FunI == II_realloc) {
449      State = ReallocMem(C, CE, false);
450    } else if (FunI == II_reallocf) {
451      State = ReallocMem(C, CE, true);
452    } else if (FunI == II_calloc) {
453      State = CallocMem(C, CE);
454    } else if (FunI == II_free) {
455      State = FreeMemAux(C, CE, State, 0, false);
456    } else if (FunI == II_strdup) {
457      State = MallocUpdateRefState(C, CE, State);
458    } else if (FunI == II_strndup) {
459      State = MallocUpdateRefState(C, CE, State);
460    }
461  }
462
463  if (Filter.CMallocOptimistic) {
464    // Check all the attributes, if there are any.
465    // There can be multiple of these attributes.
466    if (FD->hasAttrs())
467      for (specific_attr_iterator<OwnershipAttr>
468          i = FD->specific_attr_begin<OwnershipAttr>(),
469          e = FD->specific_attr_end<OwnershipAttr>();
470          i != e; ++i) {
471        switch ((*i)->getOwnKind()) {
472        case OwnershipAttr::Returns:
473          State = MallocMemReturnsAttr(C, CE, *i);
474          break;
475        case OwnershipAttr::Takes:
476        case OwnershipAttr::Holds:
477          State = FreeMemAttr(C, CE, *i);
478          break;
479        }
480      }
481  }
482  C.addTransition(State);
483}
484
485static bool isFreeWhenDoneSetToZero(const ObjCMethodCall &Call) {
486  Selector S = Call.getSelector();
487  for (unsigned i = 1; i < S.getNumArgs(); ++i)
488    if (S.getNameForSlot(i).equals("freeWhenDone"))
489      if (Call.getArgSVal(i).isConstant(0))
490        return true;
491
492  return false;
493}
494
495void MallocChecker::checkPreObjCMessage(const ObjCMethodCall &Call,
496                                        CheckerContext &C) const {
497  // If the first selector is dataWithBytesNoCopy, assume that the memory will
498  // be released with 'free' by the new object.
499  // Ex:  [NSData dataWithBytesNoCopy:bytes length:10];
500  // Unless 'freeWhenDone' param set to 0.
501  // TODO: Check that the memory was allocated with malloc.
502  Selector S = Call.getSelector();
503  if ((S.getNameForSlot(0) == "dataWithBytesNoCopy" ||
504       S.getNameForSlot(0) == "initWithBytesNoCopy" ||
505       S.getNameForSlot(0) == "initWithCharactersNoCopy") &&
506      !isFreeWhenDoneSetToZero(Call)){
507    unsigned int argIdx  = 0;
508    C.addTransition(FreeMemAux(C, Call.getArgExpr(argIdx),
509                    Call.getOriginExpr(), C.getState(), true));
510  }
511}
512
513ProgramStateRef MallocChecker::MallocMemReturnsAttr(CheckerContext &C,
514                                                    const CallExpr *CE,
515                                                    const OwnershipAttr* Att) {
516  if (Att->getModule() != "malloc")
517    return 0;
518
519  OwnershipAttr::args_iterator I = Att->args_begin(), E = Att->args_end();
520  if (I != E) {
521    return MallocMemAux(C, CE, CE->getArg(*I), UndefinedVal(), C.getState());
522  }
523  return MallocMemAux(C, CE, UnknownVal(), UndefinedVal(), C.getState());
524}
525
526ProgramStateRef MallocChecker::MallocMemAux(CheckerContext &C,
527                                           const CallExpr *CE,
528                                           SVal Size, SVal Init,
529                                           ProgramStateRef state) {
530
531  // Bind the return value to the symbolic value from the heap region.
532  // TODO: We could rewrite post visit to eval call; 'malloc' does not have
533  // side effects other than what we model here.
534  unsigned Count = C.getCurrentBlockCount();
535  SValBuilder &svalBuilder = C.getSValBuilder();
536  const LocationContext *LCtx = C.getPredecessor()->getLocationContext();
537  DefinedSVal RetVal =
538    cast<DefinedSVal>(svalBuilder.getConjuredHeapSymbolVal(CE, LCtx, Count));
539  state = state->BindExpr(CE, C.getLocationContext(), RetVal);
540
541  // We expect the malloc functions to return a pointer.
542  if (!isa<Loc>(RetVal))
543    return 0;
544
545  // Fill the region with the initialization value.
546  state = state->bindDefault(RetVal, Init);
547
548  // Set the region's extent equal to the Size parameter.
549  const SymbolicRegion *R =
550      dyn_cast_or_null<SymbolicRegion>(RetVal.getAsRegion());
551  if (!R)
552    return 0;
553  if (isa<DefinedOrUnknownSVal>(Size)) {
554    SValBuilder &svalBuilder = C.getSValBuilder();
555    DefinedOrUnknownSVal Extent = R->getExtent(svalBuilder);
556    DefinedOrUnknownSVal DefinedSize = cast<DefinedOrUnknownSVal>(Size);
557    DefinedOrUnknownSVal extentMatchesSize =
558        svalBuilder.evalEQ(state, Extent, DefinedSize);
559
560    state = state->assume(extentMatchesSize, true);
561    assert(state);
562  }
563
564  return MallocUpdateRefState(C, CE, state);
565}
566
567ProgramStateRef MallocChecker::MallocUpdateRefState(CheckerContext &C,
568                                                    const CallExpr *CE,
569                                                    ProgramStateRef state) {
570  // Get the return value.
571  SVal retVal = state->getSVal(CE, C.getLocationContext());
572
573  // We expect the malloc functions to return a pointer.
574  if (!isa<Loc>(retVal))
575    return 0;
576
577  SymbolRef Sym = retVal.getAsLocSymbol();
578  assert(Sym);
579
580  // Set the symbol's state to Allocated.
581  return state->set<RegionState>(Sym, RefState::getAllocated(CE));
582
583}
584
585ProgramStateRef MallocChecker::FreeMemAttr(CheckerContext &C,
586                                           const CallExpr *CE,
587                                           const OwnershipAttr* Att) const {
588  if (Att->getModule() != "malloc")
589    return 0;
590
591  ProgramStateRef State = C.getState();
592
593  for (OwnershipAttr::args_iterator I = Att->args_begin(), E = Att->args_end();
594       I != E; ++I) {
595    ProgramStateRef StateI = FreeMemAux(C, CE, State, *I,
596                               Att->getOwnKind() == OwnershipAttr::Holds);
597    if (StateI)
598      State = StateI;
599  }
600  return State;
601}
602
603ProgramStateRef MallocChecker::FreeMemAux(CheckerContext &C,
604                                          const CallExpr *CE,
605                                          ProgramStateRef state,
606                                          unsigned Num,
607                                          bool Hold) const {
608  if (CE->getNumArgs() < (Num + 1))
609    return 0;
610
611  return FreeMemAux(C, CE->getArg(Num), CE, state, Hold);
612}
613
614ProgramStateRef MallocChecker::FreeMemAux(CheckerContext &C,
615                                          const Expr *ArgExpr,
616                                          const Expr *ParentExpr,
617                                          ProgramStateRef state,
618                                          bool Hold) const {
619
620  SVal ArgVal = state->getSVal(ArgExpr, C.getLocationContext());
621  if (!isa<DefinedOrUnknownSVal>(ArgVal))
622    return 0;
623  DefinedOrUnknownSVal location = cast<DefinedOrUnknownSVal>(ArgVal);
624
625  // Check for null dereferences.
626  if (!isa<Loc>(location))
627    return 0;
628
629  // The explicit NULL case, no operation is performed.
630  ProgramStateRef notNullState, nullState;
631  llvm::tie(notNullState, nullState) = state->assume(location);
632  if (nullState && !notNullState)
633    return 0;
634
635  // Unknown values could easily be okay
636  // Undefined values are handled elsewhere
637  if (ArgVal.isUnknownOrUndef())
638    return 0;
639
640  const MemRegion *R = ArgVal.getAsRegion();
641
642  // Nonlocs can't be freed, of course.
643  // Non-region locations (labels and fixed addresses) also shouldn't be freed.
644  if (!R) {
645    ReportBadFree(C, ArgVal, ArgExpr->getSourceRange());
646    return 0;
647  }
648
649  R = R->StripCasts();
650
651  // Blocks might show up as heap data, but should not be free()d
652  if (isa<BlockDataRegion>(R)) {
653    ReportBadFree(C, ArgVal, ArgExpr->getSourceRange());
654    return 0;
655  }
656
657  const MemSpaceRegion *MS = R->getMemorySpace();
658
659  // Parameters, locals, statics, and globals shouldn't be freed.
660  if (!(isa<UnknownSpaceRegion>(MS) || isa<HeapSpaceRegion>(MS))) {
661    // FIXME: at the time this code was written, malloc() regions were
662    // represented by conjured symbols, which are all in UnknownSpaceRegion.
663    // This means that there isn't actually anything from HeapSpaceRegion
664    // that should be freed, even though we allow it here.
665    // Of course, free() can work on memory allocated outside the current
666    // function, so UnknownSpaceRegion is always a possibility.
667    // False negatives are better than false positives.
668
669    ReportBadFree(C, ArgVal, ArgExpr->getSourceRange());
670    return 0;
671  }
672
673  const SymbolicRegion *SR = dyn_cast<SymbolicRegion>(R);
674  // Various cases could lead to non-symbol values here.
675  // For now, ignore them.
676  if (!SR)
677    return 0;
678
679  SymbolRef Sym = SR->getSymbol();
680  const RefState *RS = state->get<RegionState>(Sym);
681
682  // Check double free.
683  if (RS && (RS->isReleased() || RS->isRelinquished())) {
684    if (ExplodedNode *N = C.generateSink()) {
685      if (!BT_DoubleFree)
686        BT_DoubleFree.reset(
687          new BugType("Double free", "Memory Error"));
688      BugReport *R = new BugReport(*BT_DoubleFree,
689        (RS->isReleased() ? "Attempt to free released memory" :
690                            "Attempt to free non-owned memory"), N);
691      R->addRange(ArgExpr->getSourceRange());
692      R->markInteresting(Sym);
693      R->addVisitor(new MallocBugVisitor(Sym));
694      C.EmitReport(R);
695    }
696    return 0;
697  }
698
699  // Normal free.
700  if (Hold)
701    return state->set<RegionState>(Sym, RefState::getRelinquished(ParentExpr));
702  return state->set<RegionState>(Sym, RefState::getReleased(ParentExpr));
703}
704
705bool MallocChecker::SummarizeValue(raw_ostream &os, SVal V) {
706  if (nonloc::ConcreteInt *IntVal = dyn_cast<nonloc::ConcreteInt>(&V))
707    os << "an integer (" << IntVal->getValue() << ")";
708  else if (loc::ConcreteInt *ConstAddr = dyn_cast<loc::ConcreteInt>(&V))
709    os << "a constant address (" << ConstAddr->getValue() << ")";
710  else if (loc::GotoLabel *Label = dyn_cast<loc::GotoLabel>(&V))
711    os << "the address of the label '" << Label->getLabel()->getName() << "'";
712  else
713    return false;
714
715  return true;
716}
717
718bool MallocChecker::SummarizeRegion(raw_ostream &os,
719                                    const MemRegion *MR) {
720  switch (MR->getKind()) {
721  case MemRegion::FunctionTextRegionKind: {
722    const FunctionDecl *FD = cast<FunctionTextRegion>(MR)->getDecl();
723    if (FD)
724      os << "the address of the function '" << *FD << '\'';
725    else
726      os << "the address of a function";
727    return true;
728  }
729  case MemRegion::BlockTextRegionKind:
730    os << "block text";
731    return true;
732  case MemRegion::BlockDataRegionKind:
733    // FIXME: where the block came from?
734    os << "a block";
735    return true;
736  default: {
737    const MemSpaceRegion *MS = MR->getMemorySpace();
738
739    if (isa<StackLocalsSpaceRegion>(MS)) {
740      const VarRegion *VR = dyn_cast<VarRegion>(MR);
741      const VarDecl *VD;
742      if (VR)
743        VD = VR->getDecl();
744      else
745        VD = NULL;
746
747      if (VD)
748        os << "the address of the local variable '" << VD->getName() << "'";
749      else
750        os << "the address of a local stack variable";
751      return true;
752    }
753
754    if (isa<StackArgumentsSpaceRegion>(MS)) {
755      const VarRegion *VR = dyn_cast<VarRegion>(MR);
756      const VarDecl *VD;
757      if (VR)
758        VD = VR->getDecl();
759      else
760        VD = NULL;
761
762      if (VD)
763        os << "the address of the parameter '" << VD->getName() << "'";
764      else
765        os << "the address of a parameter";
766      return true;
767    }
768
769    if (isa<GlobalsSpaceRegion>(MS)) {
770      const VarRegion *VR = dyn_cast<VarRegion>(MR);
771      const VarDecl *VD;
772      if (VR)
773        VD = VR->getDecl();
774      else
775        VD = NULL;
776
777      if (VD) {
778        if (VD->isStaticLocal())
779          os << "the address of the static variable '" << VD->getName() << "'";
780        else
781          os << "the address of the global variable '" << VD->getName() << "'";
782      } else
783        os << "the address of a global variable";
784      return true;
785    }
786
787    return false;
788  }
789  }
790}
791
792void MallocChecker::ReportBadFree(CheckerContext &C, SVal ArgVal,
793                                  SourceRange range) const {
794  if (ExplodedNode *N = C.generateSink()) {
795    if (!BT_BadFree)
796      BT_BadFree.reset(new BugType("Bad free", "Memory Error"));
797
798    SmallString<100> buf;
799    llvm::raw_svector_ostream os(buf);
800
801    const MemRegion *MR = ArgVal.getAsRegion();
802    if (MR) {
803      while (const ElementRegion *ER = dyn_cast<ElementRegion>(MR))
804        MR = ER->getSuperRegion();
805
806      // Special case for alloca()
807      if (isa<AllocaRegion>(MR))
808        os << "Argument to free() was allocated by alloca(), not malloc()";
809      else {
810        os << "Argument to free() is ";
811        if (SummarizeRegion(os, MR))
812          os << ", which is not memory allocated by malloc()";
813        else
814          os << "not memory allocated by malloc()";
815      }
816    } else {
817      os << "Argument to free() is ";
818      if (SummarizeValue(os, ArgVal))
819        os << ", which is not memory allocated by malloc()";
820      else
821        os << "not memory allocated by malloc()";
822    }
823
824    BugReport *R = new BugReport(*BT_BadFree, os.str(), N);
825    R->markInteresting(MR);
826    R->addRange(range);
827    C.EmitReport(R);
828  }
829}
830
831ProgramStateRef MallocChecker::ReallocMem(CheckerContext &C,
832                                          const CallExpr *CE,
833                                          bool FreesOnFail) const {
834  if (CE->getNumArgs() < 2)
835    return 0;
836
837  ProgramStateRef state = C.getState();
838  const Expr *arg0Expr = CE->getArg(0);
839  const LocationContext *LCtx = C.getLocationContext();
840  SVal Arg0Val = state->getSVal(arg0Expr, LCtx);
841  if (!isa<DefinedOrUnknownSVal>(Arg0Val))
842    return 0;
843  DefinedOrUnknownSVal arg0Val = cast<DefinedOrUnknownSVal>(Arg0Val);
844
845  SValBuilder &svalBuilder = C.getSValBuilder();
846
847  DefinedOrUnknownSVal PtrEQ =
848    svalBuilder.evalEQ(state, arg0Val, svalBuilder.makeNull());
849
850  // Get the size argument. If there is no size arg then give up.
851  const Expr *Arg1 = CE->getArg(1);
852  if (!Arg1)
853    return 0;
854
855  // Get the value of the size argument.
856  SVal Arg1ValG = state->getSVal(Arg1, LCtx);
857  if (!isa<DefinedOrUnknownSVal>(Arg1ValG))
858    return 0;
859  DefinedOrUnknownSVal Arg1Val = cast<DefinedOrUnknownSVal>(Arg1ValG);
860
861  // Compare the size argument to 0.
862  DefinedOrUnknownSVal SizeZero =
863    svalBuilder.evalEQ(state, Arg1Val,
864                       svalBuilder.makeIntValWithPtrWidth(0, false));
865
866  ProgramStateRef StatePtrIsNull, StatePtrNotNull;
867  llvm::tie(StatePtrIsNull, StatePtrNotNull) = state->assume(PtrEQ);
868  ProgramStateRef StateSizeIsZero, StateSizeNotZero;
869  llvm::tie(StateSizeIsZero, StateSizeNotZero) = state->assume(SizeZero);
870  // We only assume exceptional states if they are definitely true; if the
871  // state is under-constrained, assume regular realloc behavior.
872  bool PrtIsNull = StatePtrIsNull && !StatePtrNotNull;
873  bool SizeIsZero = StateSizeIsZero && !StateSizeNotZero;
874
875  // If the ptr is NULL and the size is not 0, the call is equivalent to
876  // malloc(size).
877  if ( PrtIsNull && !SizeIsZero) {
878    ProgramStateRef stateMalloc = MallocMemAux(C, CE, CE->getArg(1),
879                                               UndefinedVal(), StatePtrIsNull);
880    return stateMalloc;
881  }
882
883  if (PrtIsNull && SizeIsZero)
884    return 0;
885
886  // Get the from and to pointer symbols as in toPtr = realloc(fromPtr, size).
887  assert(!PrtIsNull);
888  SymbolRef FromPtr = arg0Val.getAsSymbol();
889  SVal RetVal = state->getSVal(CE, LCtx);
890  SymbolRef ToPtr = RetVal.getAsSymbol();
891  if (!FromPtr || !ToPtr)
892    return 0;
893
894  // If the size is 0, free the memory.
895  if (SizeIsZero)
896    if (ProgramStateRef stateFree = FreeMemAux(C, CE, StateSizeIsZero,0,false)){
897      // The semantics of the return value are:
898      // If size was equal to 0, either NULL or a pointer suitable to be passed
899      // to free() is returned. We just free the input pointer and do not add
900      // any constrains on the output pointer.
901      return stateFree;
902    }
903
904  // Default behavior.
905  if (ProgramStateRef stateFree = FreeMemAux(C, CE, state, 0, false)) {
906    // FIXME: We should copy the content of the original buffer.
907    ProgramStateRef stateRealloc = MallocMemAux(C, CE, CE->getArg(1),
908                                                UnknownVal(), stateFree);
909    if (!stateRealloc)
910      return 0;
911    stateRealloc = stateRealloc->set<ReallocPairs>(ToPtr,
912                                            ReallocPair(FromPtr, FreesOnFail));
913    C.getSymbolManager().addSymbolDependency(ToPtr, FromPtr);
914    return stateRealloc;
915  }
916  return 0;
917}
918
919ProgramStateRef MallocChecker::CallocMem(CheckerContext &C, const CallExpr *CE){
920  if (CE->getNumArgs() < 2)
921    return 0;
922
923  ProgramStateRef state = C.getState();
924  SValBuilder &svalBuilder = C.getSValBuilder();
925  const LocationContext *LCtx = C.getLocationContext();
926  SVal count = state->getSVal(CE->getArg(0), LCtx);
927  SVal elementSize = state->getSVal(CE->getArg(1), LCtx);
928  SVal TotalSize = svalBuilder.evalBinOp(state, BO_Mul, count, elementSize,
929                                        svalBuilder.getContext().getSizeType());
930  SVal zeroVal = svalBuilder.makeZeroVal(svalBuilder.getContext().CharTy);
931
932  return MallocMemAux(C, CE, TotalSize, zeroVal, state);
933}
934
935LeakInfo
936MallocChecker::getAllocationSite(const ExplodedNode *N, SymbolRef Sym,
937                                 CheckerContext &C) const {
938  const LocationContext *LeakContext = N->getLocationContext();
939  // Walk the ExplodedGraph backwards and find the first node that referred to
940  // the tracked symbol.
941  const ExplodedNode *AllocNode = N;
942  const MemRegion *ReferenceRegion = 0;
943
944  while (N) {
945    ProgramStateRef State = N->getState();
946    if (!State->get<RegionState>(Sym))
947      break;
948
949    // Find the most recent expression bound to the symbol in the current
950    // context.
951    if (!ReferenceRegion) {
952      if (const MemRegion *MR = C.getLocationRegionIfPostStore(N)) {
953        SVal Val = State->getSVal(MR);
954        if (Val.getAsLocSymbol() == Sym)
955          ReferenceRegion = MR;
956      }
957    }
958
959    // Allocation node, is the last node in the current context in which the
960    // symbol was tracked.
961    if (N->getLocationContext() == LeakContext)
962      AllocNode = N;
963    N = N->pred_empty() ? NULL : *(N->pred_begin());
964  }
965
966  ProgramPoint P = AllocNode->getLocation();
967  const Stmt *AllocationStmt = 0;
968  if (CallExitEnd *Exit = dyn_cast<CallExitEnd>(&P))
969    AllocationStmt = Exit->getCalleeContext()->getCallSite();
970  else if (StmtPoint *SP = dyn_cast<StmtPoint>(&P))
971    AllocationStmt = SP->getStmt();
972
973  return LeakInfo(AllocationStmt, ReferenceRegion);
974}
975
976void MallocChecker::reportLeak(SymbolRef Sym, ExplodedNode *N,
977                               CheckerContext &C) const {
978  assert(N);
979  if (!BT_Leak) {
980    BT_Leak.reset(new BugType("Memory leak", "Memory Error"));
981    // Leaks should not be reported if they are post-dominated by a sink:
982    // (1) Sinks are higher importance bugs.
983    // (2) NoReturnFunctionChecker uses sink nodes to represent paths ending
984    //     with __noreturn functions such as assert() or exit(). We choose not
985    //     to report leaks on such paths.
986    BT_Leak->setSuppressOnSink(true);
987  }
988
989  // Most bug reports are cached at the location where they occurred.
990  // With leaks, we want to unique them by the location where they were
991  // allocated, and only report a single path.
992  PathDiagnosticLocation LocUsedForUniqueing;
993  const Stmt *AllocStmt = 0;
994  const MemRegion *Region = 0;
995  llvm::tie(AllocStmt, Region) = getAllocationSite(N, Sym, C);
996  if (AllocStmt)
997    LocUsedForUniqueing = PathDiagnosticLocation::createBegin(AllocStmt,
998                            C.getSourceManager(), N->getLocationContext());
999
1000  SmallString<200> buf;
1001  llvm::raw_svector_ostream os(buf);
1002  os << "Memory is never released; potential leak";
1003  if (Region && Region->canPrintPretty()) {
1004    os << " of memory pointed to by '";
1005    Region->printPretty(os);
1006    os << '\'';
1007  }
1008
1009  BugReport *R = new BugReport(*BT_Leak, os.str(), N, LocUsedForUniqueing);
1010  R->markInteresting(Sym);
1011  R->addVisitor(new MallocBugVisitor(Sym, true));
1012  C.EmitReport(R);
1013}
1014
1015void MallocChecker::checkDeadSymbols(SymbolReaper &SymReaper,
1016                                     CheckerContext &C) const
1017{
1018  if (!SymReaper.hasDeadSymbols())
1019    return;
1020
1021  ProgramStateRef state = C.getState();
1022  RegionStateTy RS = state->get<RegionState>();
1023  RegionStateTy::Factory &F = state->get_context<RegionState>();
1024
1025  bool generateReport = false;
1026  llvm::SmallVector<SymbolRef, 2> Errors;
1027  for (RegionStateTy::iterator I = RS.begin(), E = RS.end(); I != E; ++I) {
1028    if (SymReaper.isDead(I->first)) {
1029      if (I->second.isAllocated()) {
1030        generateReport = true;
1031        Errors.push_back(I->first);
1032      }
1033      // Remove the dead symbol from the map.
1034      RS = F.remove(RS, I->first);
1035
1036    }
1037  }
1038
1039  // Cleanup the Realloc Pairs Map.
1040  ReallocMap RP = state->get<ReallocPairs>();
1041  for (ReallocMap::iterator I = RP.begin(), E = RP.end(); I != E; ++I) {
1042    if (SymReaper.isDead(I->first) ||
1043        SymReaper.isDead(I->second.ReallocatedSym)) {
1044      state = state->remove<ReallocPairs>(I->first);
1045    }
1046  }
1047
1048  // Generate leak node.
1049  static SimpleProgramPointTag Tag("MallocChecker : DeadSymbolsLeak");
1050  ExplodedNode *N = C.addTransition(C.getState(), C.getPredecessor(), &Tag);
1051
1052  if (generateReport) {
1053    for (llvm::SmallVector<SymbolRef, 2>::iterator
1054         I = Errors.begin(), E = Errors.end(); I != E; ++I) {
1055      reportLeak(*I, N, C);
1056    }
1057  }
1058  C.addTransition(state->set<RegionState>(RS), N);
1059}
1060
1061void MallocChecker::checkEndPath(CheckerContext &C) const {
1062  ProgramStateRef state = C.getState();
1063  RegionStateTy M = state->get<RegionState>();
1064
1065  // If inside inlined call, skip it.
1066  if (C.getLocationContext()->getParent() != 0)
1067    return;
1068
1069  for (RegionStateTy::iterator I = M.begin(), E = M.end(); I != E; ++I) {
1070    RefState RS = I->second;
1071    if (RS.isAllocated()) {
1072      ExplodedNode *N = C.addTransition(state);
1073      if (N)
1074        reportLeak(I->first, N, C);
1075    }
1076  }
1077}
1078
1079bool MallocChecker::checkEscape(SymbolRef Sym, const Stmt *S,
1080                                CheckerContext &C) const {
1081  ProgramStateRef state = C.getState();
1082  const RefState *RS = state->get<RegionState>(Sym);
1083  if (!RS)
1084    return false;
1085
1086  if (RS->isAllocated()) {
1087    state = state->set<RegionState>(Sym, RefState::getEscaped(S));
1088    C.addTransition(state);
1089    return true;
1090  }
1091  return false;
1092}
1093
1094void MallocChecker::checkPreStmt(const CallExpr *CE, CheckerContext &C) const {
1095  // We will check for double free in the post visit.
1096  if (isFreeFunction(C.getCalleeDecl(CE), C.getASTContext()))
1097    return;
1098
1099  // Check use after free, when a freed pointer is passed to a call.
1100  ProgramStateRef State = C.getState();
1101  for (CallExpr::const_arg_iterator I = CE->arg_begin(),
1102                                    E = CE->arg_end(); I != E; ++I) {
1103    const Expr *A = *I;
1104    if (A->getType().getTypePtr()->isAnyPointerType()) {
1105      SymbolRef Sym = State->getSVal(A, C.getLocationContext()).getAsSymbol();
1106      if (!Sym)
1107        continue;
1108      if (checkUseAfterFree(Sym, C, A))
1109        return;
1110    }
1111  }
1112}
1113
1114void MallocChecker::checkPreStmt(const ReturnStmt *S, CheckerContext &C) const {
1115  const Expr *E = S->getRetValue();
1116  if (!E)
1117    return;
1118
1119  // Check if we are returning a symbol.
1120  ProgramStateRef State = C.getState();
1121  SVal RetVal = State->getSVal(E, C.getLocationContext());
1122  SymbolRef Sym = RetVal.getAsSymbol();
1123  if (!Sym)
1124    // If we are returning a field of the allocated struct or an array element,
1125    // the callee could still free the memory.
1126    // TODO: This logic should be a part of generic symbol escape callback.
1127    if (const MemRegion *MR = RetVal.getAsRegion())
1128      if (isa<FieldRegion>(MR) || isa<ElementRegion>(MR))
1129        if (const SymbolicRegion *BMR =
1130              dyn_cast<SymbolicRegion>(MR->getBaseRegion()))
1131          Sym = BMR->getSymbol();
1132
1133  // Check if we are returning freed memory.
1134  if (Sym)
1135    if (checkUseAfterFree(Sym, C, E))
1136      return;
1137
1138  // If this function body is not inlined, stop tracking any returned symbols.
1139  if (C.getLocationContext()->getParent() == 0) {
1140    State =
1141      State->scanReachableSymbols<StopTrackingCallback>(RetVal).getState();
1142    C.addTransition(State);
1143  }
1144}
1145
1146// TODO: Blocks should be either inlined or should call invalidate regions
1147// upon invocation. After that's in place, special casing here will not be
1148// needed.
1149void MallocChecker::checkPostStmt(const BlockExpr *BE,
1150                                  CheckerContext &C) const {
1151
1152  // Scan the BlockDecRefExprs for any object the retain count checker
1153  // may be tracking.
1154  if (!BE->getBlockDecl()->hasCaptures())
1155    return;
1156
1157  ProgramStateRef state = C.getState();
1158  const BlockDataRegion *R =
1159    cast<BlockDataRegion>(state->getSVal(BE,
1160                                         C.getLocationContext()).getAsRegion());
1161
1162  BlockDataRegion::referenced_vars_iterator I = R->referenced_vars_begin(),
1163                                            E = R->referenced_vars_end();
1164
1165  if (I == E)
1166    return;
1167
1168  SmallVector<const MemRegion*, 10> Regions;
1169  const LocationContext *LC = C.getLocationContext();
1170  MemRegionManager &MemMgr = C.getSValBuilder().getRegionManager();
1171
1172  for ( ; I != E; ++I) {
1173    const VarRegion *VR = *I;
1174    if (VR->getSuperRegion() == R) {
1175      VR = MemMgr.getVarRegion(VR->getDecl(), LC);
1176    }
1177    Regions.push_back(VR);
1178  }
1179
1180  state =
1181    state->scanReachableSymbols<StopTrackingCallback>(Regions.data(),
1182                                    Regions.data() + Regions.size()).getState();
1183  C.addTransition(state);
1184}
1185
1186bool MallocChecker::isReleased(SymbolRef Sym, CheckerContext &C) const {
1187  assert(Sym);
1188  const RefState *RS = C.getState()->get<RegionState>(Sym);
1189  return (RS && RS->isReleased());
1190}
1191
1192bool MallocChecker::checkUseAfterFree(SymbolRef Sym, CheckerContext &C,
1193                                      const Stmt *S) const {
1194  if (isReleased(Sym, C)) {
1195    if (ExplodedNode *N = C.generateSink()) {
1196      if (!BT_UseFree)
1197        BT_UseFree.reset(new BugType("Use-after-free", "Memory Error"));
1198
1199      BugReport *R = new BugReport(*BT_UseFree,
1200                                   "Use of memory after it is freed",N);
1201      if (S)
1202        R->addRange(S->getSourceRange());
1203      R->markInteresting(Sym);
1204      R->addVisitor(new MallocBugVisitor(Sym));
1205      C.EmitReport(R);
1206      return true;
1207    }
1208  }
1209  return false;
1210}
1211
1212// Check if the location is a freed symbolic region.
1213void MallocChecker::checkLocation(SVal l, bool isLoad, const Stmt *S,
1214                                  CheckerContext &C) const {
1215  SymbolRef Sym = l.getLocSymbolInBase();
1216  if (Sym)
1217    checkUseAfterFree(Sym, C, S);
1218}
1219
1220//===----------------------------------------------------------------------===//
1221// Check various ways a symbol can be invalidated.
1222// TODO: This logic (the next 3 functions) is copied/similar to the
1223// RetainRelease checker. We might want to factor this out.
1224//===----------------------------------------------------------------------===//
1225
1226// Stop tracking symbols when a value escapes as a result of checkBind.
1227// A value escapes in three possible cases:
1228// (1) we are binding to something that is not a memory region.
1229// (2) we are binding to a memregion that does not have stack storage
1230// (3) we are binding to a memregion with stack storage that the store
1231//     does not understand.
1232void MallocChecker::checkBind(SVal loc, SVal val, const Stmt *S,
1233                              CheckerContext &C) const {
1234  // Are we storing to something that causes the value to "escape"?
1235  bool escapes = true;
1236  ProgramStateRef state = C.getState();
1237
1238  if (loc::MemRegionVal *regionLoc = dyn_cast<loc::MemRegionVal>(&loc)) {
1239    escapes = !regionLoc->getRegion()->hasStackStorage();
1240
1241    if (!escapes) {
1242      // To test (3), generate a new state with the binding added.  If it is
1243      // the same state, then it escapes (since the store cannot represent
1244      // the binding).
1245      // Do this only if we know that the store is not supposed to generate the
1246      // same state.
1247      SVal StoredVal = state->getSVal(regionLoc->getRegion());
1248      if (StoredVal != val)
1249        escapes = (state == (state->bindLoc(*regionLoc, val)));
1250    }
1251  }
1252
1253  // If our store can represent the binding and we aren't storing to something
1254  // that doesn't have local storage then just return and have the simulation
1255  // state continue as is.
1256  if (!escapes)
1257      return;
1258
1259  // Otherwise, find all symbols referenced by 'val' that we are tracking
1260  // and stop tracking them.
1261  state = state->scanReachableSymbols<StopTrackingCallback>(val).getState();
1262  C.addTransition(state);
1263}
1264
1265// If a symbolic region is assumed to NULL (or another constant), stop tracking
1266// it - assuming that allocation failed on this path.
1267ProgramStateRef MallocChecker::evalAssume(ProgramStateRef state,
1268                                              SVal Cond,
1269                                              bool Assumption) const {
1270  RegionStateTy RS = state->get<RegionState>();
1271  for (RegionStateTy::iterator I = RS.begin(), E = RS.end(); I != E; ++I) {
1272    // If the symbol is assumed to NULL or another constant, this will
1273    // return an APSInt*.
1274    if (state->getSymVal(I.getKey()))
1275      state = state->remove<RegionState>(I.getKey());
1276  }
1277
1278  // Realloc returns 0 when reallocation fails, which means that we should
1279  // restore the state of the pointer being reallocated.
1280  ReallocMap RP = state->get<ReallocPairs>();
1281  for (ReallocMap::iterator I = RP.begin(), E = RP.end(); I != E; ++I) {
1282    // If the symbol is assumed to NULL or another constant, this will
1283    // return an APSInt*.
1284    if (state->getSymVal(I.getKey())) {
1285      SymbolRef ReallocSym = I.getData().ReallocatedSym;
1286      const RefState *RS = state->get<RegionState>(ReallocSym);
1287      if (RS) {
1288        if (RS->isReleased() && ! I.getData().IsFreeOnFailure)
1289          state = state->set<RegionState>(ReallocSym,
1290                             RefState::getAllocated(RS->getStmt()));
1291      }
1292      state = state->remove<ReallocPairs>(I.getKey());
1293    }
1294  }
1295
1296  return state;
1297}
1298
1299// Check if the function is known to us. So, for example, we could
1300// conservatively assume it can free/reallocate its pointer arguments.
1301// (We assume that the pointers cannot escape through calls to system
1302// functions not handled by this checker.)
1303bool MallocChecker::doesNotFreeMemory(const CallEvent *Call,
1304                                      ProgramStateRef State) const {
1305  assert(Call);
1306
1307  // For now, assume that any C++ call can free memory.
1308  // TODO: If we want to be more optimistic here, we'll need to make sure that
1309  // regions escape to C++ containers. They seem to do that even now, but for
1310  // mysterious reasons.
1311  if (!(isa<FunctionCall>(Call) || isa<ObjCMethodCall>(Call)))
1312    return false;
1313
1314  // Check Objective-C messages by selector name.
1315  if (const ObjCMethodCall *Msg = dyn_cast<ObjCMethodCall>(Call)) {
1316    // If it's not a framework call, or if it takes a callback, assume it
1317    // can free memory.
1318    if (!Call->isInSystemHeader() || Call->hasNonZeroCallbackArg())
1319      return false;
1320
1321    Selector S = Msg->getSelector();
1322
1323    // Whitelist the ObjC methods which do free memory.
1324    // - Anything containing 'freeWhenDone' param set to 1.
1325    //   Ex: dataWithBytesNoCopy:length:freeWhenDone.
1326    for (unsigned i = 1; i < S.getNumArgs(); ++i) {
1327      if (S.getNameForSlot(i).equals("freeWhenDone")) {
1328        if (Call->getArgSVal(i).isConstant(1))
1329          return false;
1330        else
1331          return true;
1332      }
1333    }
1334
1335    // If the first selector ends with NoCopy, assume that the ownership is
1336    // transferred as well.
1337    // Ex:  [NSData dataWithBytesNoCopy:bytes length:10];
1338    StringRef FirstSlot = S.getNameForSlot(0);
1339    if (FirstSlot.endswith("NoCopy"))
1340      return false;
1341
1342    // If the first selector starts with addPointer, insertPointer,
1343    // or replacePointer, assume we are dealing with NSPointerArray or similar.
1344    // This is similar to C++ containers (vector); we still might want to check
1345    // that the pointers get freed by following the container itself.
1346    if (FirstSlot.startswith("addPointer") ||
1347        FirstSlot.startswith("insertPointer") ||
1348        FirstSlot.startswith("replacePointer")) {
1349      return false;
1350    }
1351
1352    // Otherwise, assume that the method does not free memory.
1353    // Most framework methods do not free memory.
1354    return true;
1355  }
1356
1357  // At this point the only thing left to handle is straight function calls.
1358  const FunctionDecl *FD = cast<FunctionCall>(Call)->getDecl();
1359  if (!FD)
1360    return false;
1361
1362  ASTContext &ASTC = State->getStateManager().getContext();
1363
1364  // If it's one of the allocation functions we can reason about, we model
1365  // its behavior explicitly.
1366  if (isMemFunction(FD, ASTC))
1367    return true;
1368
1369  // If it's not a system call, assume it frees memory.
1370  if (!Call->isInSystemHeader())
1371    return false;
1372
1373  // White list the system functions whose arguments escape.
1374  const IdentifierInfo *II = FD->getIdentifier();
1375  if (!II)
1376    return false;
1377  StringRef FName = II->getName();
1378
1379  // White list the 'XXXNoCopy' CoreFoundation functions.
1380  // We specifically check these before
1381  if (FName.endswith("NoCopy")) {
1382    // Look for the deallocator argument. We know that the memory ownership
1383    // is not transferred only if the deallocator argument is
1384    // 'kCFAllocatorNull'.
1385    for (unsigned i = 1; i < Call->getNumArgs(); ++i) {
1386      const Expr *ArgE = Call->getArgExpr(i)->IgnoreParenCasts();
1387      if (const DeclRefExpr *DE = dyn_cast<DeclRefExpr>(ArgE)) {
1388        StringRef DeallocatorName = DE->getFoundDecl()->getName();
1389        if (DeallocatorName == "kCFAllocatorNull")
1390          return true;
1391      }
1392    }
1393    return false;
1394  }
1395
1396  // Associating streams with malloced buffers. The pointer can escape if
1397  // 'closefn' is specified (and if that function does free memory),
1398  // but it will not if closefn is not specified.
1399  // Currently, we do not inspect the 'closefn' function (PR12101).
1400  if (FName == "funopen")
1401    if (Call->getNumArgs() >= 4 && Call->getArgSVal(4).isConstant(0))
1402      return true;
1403
1404  // Do not warn on pointers passed to 'setbuf' when used with std streams,
1405  // these leaks might be intentional when setting the buffer for stdio.
1406  // http://stackoverflow.com/questions/2671151/who-frees-setvbuf-buffer
1407  if (FName == "setbuf" || FName =="setbuffer" ||
1408      FName == "setlinebuf" || FName == "setvbuf") {
1409    if (Call->getNumArgs() >= 1) {
1410      const Expr *ArgE = Call->getArgExpr(0)->IgnoreParenCasts();
1411      if (const DeclRefExpr *ArgDRE = dyn_cast<DeclRefExpr>(ArgE))
1412        if (const VarDecl *D = dyn_cast<VarDecl>(ArgDRE->getDecl()))
1413          if (D->getCanonicalDecl()->getName().find("std") != StringRef::npos)
1414            return false;
1415    }
1416  }
1417
1418  // A bunch of other functions which either take ownership of a pointer or
1419  // wrap the result up in a struct or object, meaning it can be freed later.
1420  // (See RetainCountChecker.) Not all the parameters here are invalidated,
1421  // but the Malloc checker cannot differentiate between them. The right way
1422  // of doing this would be to implement a pointer escapes callback.
1423  if (FName == "CGBitmapContextCreate" ||
1424      FName == "CGBitmapContextCreateWithData" ||
1425      FName == "CVPixelBufferCreateWithBytes" ||
1426      FName == "CVPixelBufferCreateWithPlanarBytes" ||
1427      FName == "OSAtomicEnqueue") {
1428    return false;
1429  }
1430
1431  // Handle cases where we know a buffer's /address/ can escape.
1432  // Note that the above checks handle some special cases where we know that
1433  // even though the address escapes, it's still our responsibility to free the
1434  // buffer.
1435  if (Call->argumentsMayEscape())
1436    return false;
1437
1438  // Otherwise, assume that the function does not free memory.
1439  // Most system calls do not free the memory.
1440  return true;
1441}
1442
1443// If the symbol we are tracking is invalidated, but not explicitly (ex: the &p
1444// escapes, when we are tracking p), do not track the symbol as we cannot reason
1445// about it anymore.
1446ProgramStateRef
1447MallocChecker::checkRegionChanges(ProgramStateRef State,
1448                            const StoreManager::InvalidatedSymbols *invalidated,
1449                                    ArrayRef<const MemRegion *> ExplicitRegions,
1450                                    ArrayRef<const MemRegion *> Regions,
1451                                    const CallEvent *Call) const {
1452  if (!invalidated || invalidated->empty())
1453    return State;
1454  llvm::SmallPtrSet<SymbolRef, 8> WhitelistedSymbols;
1455
1456  // If it's a call which might free or reallocate memory, we assume that all
1457  // regions (explicit and implicit) escaped.
1458
1459  // Otherwise, whitelist explicit pointers; we still can track them.
1460  if (!Call || doesNotFreeMemory(Call, State)) {
1461    for (ArrayRef<const MemRegion *>::iterator I = ExplicitRegions.begin(),
1462        E = ExplicitRegions.end(); I != E; ++I) {
1463      if (const SymbolicRegion *R = (*I)->StripCasts()->getAs<SymbolicRegion>())
1464        WhitelistedSymbols.insert(R->getSymbol());
1465    }
1466  }
1467
1468  for (StoreManager::InvalidatedSymbols::const_iterator I=invalidated->begin(),
1469       E = invalidated->end(); I!=E; ++I) {
1470    SymbolRef sym = *I;
1471    if (WhitelistedSymbols.count(sym))
1472      continue;
1473    // The symbol escaped. Note, we assume that if the symbol is released,
1474    // passing it out will result in a use after free. We also keep tracking
1475    // relinquished symbols.
1476    if (const RefState *RS = State->get<RegionState>(sym)) {
1477      if (RS->isAllocated())
1478        State = State->set<RegionState>(sym,
1479                                        RefState::getEscaped(RS->getStmt()));
1480    }
1481  }
1482  return State;
1483}
1484
1485static SymbolRef findFailedReallocSymbol(ProgramStateRef currState,
1486                                         ProgramStateRef prevState) {
1487  ReallocMap currMap = currState->get<ReallocPairs>();
1488  ReallocMap prevMap = prevState->get<ReallocPairs>();
1489
1490  for (ReallocMap::iterator I = prevMap.begin(), E = prevMap.end();
1491       I != E; ++I) {
1492    SymbolRef sym = I.getKey();
1493    if (!currMap.lookup(sym))
1494      return sym;
1495  }
1496
1497  return NULL;
1498}
1499
1500PathDiagnosticPiece *
1501MallocChecker::MallocBugVisitor::VisitNode(const ExplodedNode *N,
1502                                           const ExplodedNode *PrevN,
1503                                           BugReporterContext &BRC,
1504                                           BugReport &BR) {
1505  ProgramStateRef state = N->getState();
1506  ProgramStateRef statePrev = PrevN->getState();
1507
1508  const RefState *RS = state->get<RegionState>(Sym);
1509  const RefState *RSPrev = statePrev->get<RegionState>(Sym);
1510  if (!RS)
1511    return 0;
1512
1513  const Stmt *S = 0;
1514  const char *Msg = 0;
1515  StackHintGeneratorForSymbol *StackHint = 0;
1516
1517  // Retrieve the associated statement.
1518  ProgramPoint ProgLoc = N->getLocation();
1519  if (StmtPoint *SP = dyn_cast<StmtPoint>(&ProgLoc))
1520    S = SP->getStmt();
1521  else if (CallExitEnd *Exit = dyn_cast<CallExitEnd>(&ProgLoc))
1522    S = Exit->getCalleeContext()->getCallSite();
1523  // If an assumption was made on a branch, it should be caught
1524  // here by looking at the state transition.
1525  else if (BlockEdge *Edge = dyn_cast<BlockEdge>(&ProgLoc)) {
1526    const CFGBlock *srcBlk = Edge->getSrc();
1527    S = srcBlk->getTerminator();
1528  }
1529  if (!S)
1530    return 0;
1531
1532  // FIXME: We will eventually need to handle non-statement-based events
1533  // (__attribute__((cleanup))).
1534
1535  // Find out if this is an interesting point and what is the kind.
1536  if (Mode == Normal) {
1537    if (isAllocated(RS, RSPrev, S)) {
1538      Msg = "Memory is allocated";
1539      StackHint = new StackHintGeneratorForSymbol(Sym,
1540                                                  "Returned allocated memory");
1541    } else if (isReleased(RS, RSPrev, S)) {
1542      Msg = "Memory is released";
1543      StackHint = new StackHintGeneratorForSymbol(Sym,
1544                                                  "Returned released memory");
1545    } else if (isRelinquished(RS, RSPrev, S)) {
1546      Msg = "Memory ownership is transfered";
1547      StackHint = new StackHintGeneratorForSymbol(Sym, "");
1548    } else if (isReallocFailedCheck(RS, RSPrev, S)) {
1549      Mode = ReallocationFailed;
1550      Msg = "Reallocation failed";
1551      StackHint = new StackHintGeneratorForReallocationFailed(Sym,
1552                                                       "Reallocation failed");
1553
1554      if (SymbolRef sym = findFailedReallocSymbol(state, statePrev)) {
1555        // Is it possible to fail two reallocs WITHOUT testing in between?
1556        assert((!FailedReallocSymbol || FailedReallocSymbol == sym) &&
1557          "We only support one failed realloc at a time.");
1558        BR.markInteresting(sym);
1559        FailedReallocSymbol = sym;
1560      }
1561    }
1562
1563  // We are in a special mode if a reallocation failed later in the path.
1564  } else if (Mode == ReallocationFailed) {
1565    assert(FailedReallocSymbol && "No symbol to look for.");
1566
1567    // Is this is the first appearance of the reallocated symbol?
1568    if (!statePrev->get<RegionState>(FailedReallocSymbol)) {
1569      // We're at the reallocation point.
1570      Msg = "Attempt to reallocate memory";
1571      StackHint = new StackHintGeneratorForSymbol(Sym,
1572                                                 "Returned reallocated memory");
1573      FailedReallocSymbol = NULL;
1574      Mode = Normal;
1575    }
1576  }
1577
1578  if (!Msg)
1579    return 0;
1580  assert(StackHint);
1581
1582  // Generate the extra diagnostic.
1583  PathDiagnosticLocation Pos(S, BRC.getSourceManager(),
1584                             N->getLocationContext());
1585  return new PathDiagnosticEventPiece(Pos, Msg, true, StackHint);
1586}
1587
1588void MallocChecker::printState(raw_ostream &Out, ProgramStateRef State,
1589                               const char *NL, const char *Sep) const {
1590
1591  RegionStateTy RS = State->get<RegionState>();
1592
1593  if (!RS.isEmpty())
1594    Out << "Has Malloc data" << NL;
1595}
1596
1597#define REGISTER_CHECKER(name) \
1598void ento::register##name(CheckerManager &mgr) {\
1599  registerCStringCheckerBasic(mgr); \
1600  mgr.registerChecker<MallocChecker>()->Filter.C##name = true;\
1601}
1602
1603REGISTER_CHECKER(MallocPessimistic)
1604REGISTER_CHECKER(MallocOptimistic)
1605