1//== NullDerefChecker.cpp - Null dereference checker ------------*- C++ -*--==//
2//
3//                     The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// This defines NullDerefChecker, a builtin check in ExprEngine that performs
11// checks for null pointers at loads and stores.
12//
13//===----------------------------------------------------------------------===//
14
15#include "ClangSACheckers.h"
16#include "clang/AST/ExprObjC.h"
17#include "clang/StaticAnalyzer/Core/BugReporter/BugType.h"
18#include "clang/StaticAnalyzer/Core/Checker.h"
19#include "clang/StaticAnalyzer/Core/CheckerManager.h"
20#include "clang/StaticAnalyzer/Core/PathSensitive/CheckerContext.h"
21#include "llvm/ADT/SmallString.h"
22#include "llvm/Support/raw_ostream.h"
23
24using namespace clang;
25using namespace ento;
26
27namespace {
28class DereferenceChecker
29    : public Checker< check::Location,
30                      check::Bind,
31                      EventDispatcher<ImplicitNullDerefEvent> > {
32  mutable OwningPtr<BuiltinBug> BT_null;
33  mutable OwningPtr<BuiltinBug> BT_undef;
34
35  void reportBug(ProgramStateRef State, const Stmt *S, CheckerContext &C,
36                 bool IsBind = false) const;
37
38public:
39  void checkLocation(SVal location, bool isLoad, const Stmt* S,
40                     CheckerContext &C) const;
41  void checkBind(SVal L, SVal V, const Stmt *S, CheckerContext &C) const;
42
43  static void AddDerefSource(raw_ostream &os,
44                             SmallVectorImpl<SourceRange> &Ranges,
45                             const Expr *Ex, const ProgramState *state,
46                             const LocationContext *LCtx,
47                             bool loadedFrom = false);
48};
49} // end anonymous namespace
50
51void
52DereferenceChecker::AddDerefSource(raw_ostream &os,
53                                   SmallVectorImpl<SourceRange> &Ranges,
54                                   const Expr *Ex,
55                                   const ProgramState *state,
56                                   const LocationContext *LCtx,
57                                   bool loadedFrom) {
58  Ex = Ex->IgnoreParenLValueCasts();
59  switch (Ex->getStmtClass()) {
60    default:
61      break;
62    case Stmt::DeclRefExprClass: {
63      const DeclRefExpr *DR = cast<DeclRefExpr>(Ex);
64      if (const VarDecl *VD = dyn_cast<VarDecl>(DR->getDecl())) {
65        os << " (" << (loadedFrom ? "loaded from" : "from")
66           << " variable '" <<  VD->getName() << "')";
67        Ranges.push_back(DR->getSourceRange());
68      }
69      break;
70    }
71    case Stmt::MemberExprClass: {
72      const MemberExpr *ME = cast<MemberExpr>(Ex);
73      os << " (" << (loadedFrom ? "loaded from" : "via")
74         << " field '" << ME->getMemberNameInfo() << "')";
75      SourceLocation L = ME->getMemberLoc();
76      Ranges.push_back(SourceRange(L, L));
77      break;
78    }
79    case Stmt::ObjCIvarRefExprClass: {
80      const ObjCIvarRefExpr *IV = cast<ObjCIvarRefExpr>(Ex);
81      os << " (" << (loadedFrom ? "loaded from" : "via")
82         << " ivar '" << IV->getDecl()->getName() << "')";
83      SourceLocation L = IV->getLocation();
84      Ranges.push_back(SourceRange(L, L));
85      break;
86    }
87  }
88}
89
90void DereferenceChecker::reportBug(ProgramStateRef State, const Stmt *S,
91                                   CheckerContext &C, bool IsBind) const {
92  // Generate an error node.
93  ExplodedNode *N = C.generateSink(State);
94  if (!N)
95    return;
96
97  // We know that 'location' cannot be non-null.  This is what
98  // we call an "explicit" null dereference.
99  if (!BT_null)
100    BT_null.reset(new BuiltinBug("Dereference of null pointer"));
101
102  SmallString<100> buf;
103  llvm::raw_svector_ostream os(buf);
104
105  SmallVector<SourceRange, 2> Ranges;
106
107  // Walk through lvalue casts to get the original expression
108  // that syntactically caused the load.
109  if (const Expr *expr = dyn_cast<Expr>(S))
110    S = expr->IgnoreParenLValueCasts();
111
112  if (IsBind) {
113    if (const BinaryOperator *BO = dyn_cast<BinaryOperator>(S)) {
114      if (BO->isAssignmentOp())
115        S = BO->getRHS();
116    } else if (const DeclStmt *DS = dyn_cast<DeclStmt>(S)) {
117      assert(DS->isSingleDecl() && "We process decls one by one");
118      if (const VarDecl *VD = dyn_cast<VarDecl>(DS->getSingleDecl()))
119        if (const Expr *Init = VD->getAnyInitializer())
120          S = Init;
121    }
122  }
123
124  switch (S->getStmtClass()) {
125  case Stmt::ArraySubscriptExprClass: {
126    os << "Array access";
127    const ArraySubscriptExpr *AE = cast<ArraySubscriptExpr>(S);
128    AddDerefSource(os, Ranges, AE->getBase()->IgnoreParenCasts(),
129                   State.getPtr(), N->getLocationContext());
130    os << " results in a null pointer dereference";
131    break;
132  }
133  case Stmt::UnaryOperatorClass: {
134    os << "Dereference of null pointer";
135    const UnaryOperator *U = cast<UnaryOperator>(S);
136    AddDerefSource(os, Ranges, U->getSubExpr()->IgnoreParens(),
137                   State.getPtr(), N->getLocationContext(), true);
138    break;
139  }
140  case Stmt::MemberExprClass: {
141    const MemberExpr *M = cast<MemberExpr>(S);
142    if (M->isArrow() || bugreporter::isDeclRefExprToReference(M->getBase())) {
143      os << "Access to field '" << M->getMemberNameInfo()
144         << "' results in a dereference of a null pointer";
145      AddDerefSource(os, Ranges, M->getBase()->IgnoreParenCasts(),
146                     State.getPtr(), N->getLocationContext(), true);
147    }
148    break;
149  }
150  case Stmt::ObjCIvarRefExprClass: {
151    const ObjCIvarRefExpr *IV = cast<ObjCIvarRefExpr>(S);
152    os << "Access to instance variable '" << *IV->getDecl()
153       << "' results in a dereference of a null pointer";
154    AddDerefSource(os, Ranges, IV->getBase()->IgnoreParenCasts(),
155                   State.getPtr(), N->getLocationContext(), true);
156    break;
157  }
158  default:
159    break;
160  }
161
162  os.flush();
163  BugReport *report =
164    new BugReport(*BT_null,
165                  buf.empty() ? BT_null->getDescription() : buf.str(),
166                  N);
167
168  bugreporter::trackNullOrUndefValue(N, bugreporter::getDerefExpr(S), *report);
169
170  for (SmallVectorImpl<SourceRange>::iterator
171       I = Ranges.begin(), E = Ranges.end(); I!=E; ++I)
172    report->addRange(*I);
173
174  C.emitReport(report);
175}
176
177void DereferenceChecker::checkLocation(SVal l, bool isLoad, const Stmt* S,
178                                       CheckerContext &C) const {
179  // Check for dereference of an undefined value.
180  if (l.isUndef()) {
181    if (ExplodedNode *N = C.generateSink()) {
182      if (!BT_undef)
183        BT_undef.reset(new BuiltinBug("Dereference of undefined pointer value"));
184
185      BugReport *report =
186        new BugReport(*BT_undef, BT_undef->getDescription(), N);
187      bugreporter::trackNullOrUndefValue(N, bugreporter::getDerefExpr(S),
188                                         *report);
189      C.emitReport(report);
190    }
191    return;
192  }
193
194  DefinedOrUnknownSVal location = l.castAs<DefinedOrUnknownSVal>();
195
196  // Check for null dereferences.
197  if (!location.getAs<Loc>())
198    return;
199
200  ProgramStateRef state = C.getState();
201
202  ProgramStateRef notNullState, nullState;
203  llvm::tie(notNullState, nullState) = state->assume(location);
204
205  // The explicit NULL case.
206  if (nullState) {
207    if (!notNullState) {
208      reportBug(nullState, S, C);
209      return;
210    }
211
212    // Otherwise, we have the case where the location could either be
213    // null or not-null.  Record the error node as an "implicit" null
214    // dereference.
215    if (ExplodedNode *N = C.generateSink(nullState)) {
216      ImplicitNullDerefEvent event = { l, isLoad, N, &C.getBugReporter() };
217      dispatchEvent(event);
218    }
219  }
220
221  // From this point forward, we know that the location is not null.
222  C.addTransition(notNullState);
223}
224
225void DereferenceChecker::checkBind(SVal L, SVal V, const Stmt *S,
226                                   CheckerContext &C) const {
227  // If we're binding to a reference, check if the value is known to be null.
228  if (V.isUndef())
229    return;
230
231  const MemRegion *MR = L.getAsRegion();
232  const TypedValueRegion *TVR = dyn_cast_or_null<TypedValueRegion>(MR);
233  if (!TVR)
234    return;
235
236  if (!TVR->getValueType()->isReferenceType())
237    return;
238
239  ProgramStateRef State = C.getState();
240
241  ProgramStateRef StNonNull, StNull;
242  llvm::tie(StNonNull, StNull) =
243      State->assume(V.castAs<DefinedOrUnknownSVal>());
244
245  if (StNull) {
246    if (!StNonNull) {
247      reportBug(StNull, S, C, /*isBind=*/true);
248      return;
249    }
250
251    // At this point the value could be either null or non-null.
252    // Record this as an "implicit" null dereference.
253    if (ExplodedNode *N = C.generateSink(StNull)) {
254      ImplicitNullDerefEvent event = { V, /*isLoad=*/true, N,
255                                       &C.getBugReporter() };
256      dispatchEvent(event);
257    }
258  }
259
260  // Unlike a regular null dereference, initializing a reference with a
261  // dereferenced null pointer does not actually cause a runtime exception in
262  // Clang's implementation of references.
263  //
264  //   int &r = *p; // safe??
265  //   if (p != NULL) return; // uh-oh
266  //   r = 5; // trap here
267  //
268  // The standard says this is invalid as soon as we try to create a "null
269  // reference" (there is no such thing), but turning this into an assumption
270  // that 'p' is never null will not match our actual runtime behavior.
271  // So we do not record this assumption, allowing us to warn on the last line
272  // of this example.
273  //
274  // We do need to add a transition because we may have generated a sink for
275  // the "implicit" null dereference.
276  C.addTransition(State, this);
277}
278
279void ento::registerDereferenceChecker(CheckerManager &mgr) {
280  mgr.registerChecker<DereferenceChecker>();
281}
282