Home | History | Annotate | Download | only in Checkers
      1 //===--- CallAndMessageChecker.cpp ------------------------------*- C++ -*--==//
      2 //
      3 //                     The LLVM Compiler Infrastructure
      4 //
      5 // This file is distributed under the University of Illinois Open Source
      6 // License. See LICENSE.TXT for details.
      7 //
      8 //===----------------------------------------------------------------------===//
      9 //
     10 // This defines CallAndMessageChecker, a builtin checker that checks for various
     11 // errors of call and objc message expressions.
     12 //
     13 //===----------------------------------------------------------------------===//
     14 
     15 #include "ClangSACheckers.h"
     16 #include "clang/StaticAnalyzer/Core/Checker.h"
     17 #include "clang/StaticAnalyzer/Core/CheckerManager.h"
     18 #include "clang/StaticAnalyzer/Core/PathSensitive/CallEvent.h"
     19 #include "clang/StaticAnalyzer/Core/PathSensitive/CheckerContext.h"
     20 #include "clang/StaticAnalyzer/Core/BugReporter/BugType.h"
     21 #include "clang/AST/ParentMap.h"
     22 #include "clang/Basic/TargetInfo.h"
     23 #include "llvm/ADT/SmallString.h"
     24 
     25 using namespace clang;
     26 using namespace ento;
     27 
     28 namespace {
     29 class CallAndMessageChecker
     30   : public Checker< check::PreStmt<CallExpr>, check::PreObjCMessage,
     31                     check::PreCall > {
     32   mutable OwningPtr<BugType> BT_call_null;
     33   mutable OwningPtr<BugType> BT_call_undef;
     34   mutable OwningPtr<BugType> BT_cxx_call_null;
     35   mutable OwningPtr<BugType> BT_cxx_call_undef;
     36   mutable OwningPtr<BugType> BT_call_arg;
     37   mutable OwningPtr<BugType> BT_msg_undef;
     38   mutable OwningPtr<BugType> BT_objc_prop_undef;
     39   mutable OwningPtr<BugType> BT_objc_subscript_undef;
     40   mutable OwningPtr<BugType> BT_msg_arg;
     41   mutable OwningPtr<BugType> BT_msg_ret;
     42 public:
     43 
     44   void checkPreStmt(const CallExpr *CE, CheckerContext &C) const;
     45   void checkPreObjCMessage(const ObjCMethodCall &msg, CheckerContext &C) const;
     46   void checkPreCall(const CallEvent &Call, CheckerContext &C) const;
     47 
     48 private:
     49   static bool PreVisitProcessArg(CheckerContext &C, SVal V,
     50                                  SourceRange argRange, const Expr *argEx,
     51                                  bool IsFirstArgument, bool checkUninitFields,
     52                                  const CallEvent &Call, OwningPtr<BugType> &BT);
     53 
     54   static void emitBadCall(BugType *BT, CheckerContext &C, const Expr *BadE);
     55   void emitNilReceiverBug(CheckerContext &C, const ObjCMethodCall &msg,
     56                           ExplodedNode *N) const;
     57 
     58   void HandleNilReceiver(CheckerContext &C,
     59                          ProgramStateRef state,
     60                          const ObjCMethodCall &msg) const;
     61 
     62   static void LazyInit_BT(const char *desc, OwningPtr<BugType> &BT) {
     63     if (!BT)
     64       BT.reset(new BuiltinBug(desc));
     65   }
     66 };
     67 } // end anonymous namespace
     68 
     69 void CallAndMessageChecker::emitBadCall(BugType *BT, CheckerContext &C,
     70                                         const Expr *BadE) {
     71   ExplodedNode *N = C.generateSink();
     72   if (!N)
     73     return;
     74 
     75   BugReport *R = new BugReport(*BT, BT->getName(), N);
     76   if (BadE) {
     77     R->addRange(BadE->getSourceRange());
     78     bugreporter::trackNullOrUndefValue(N, BadE, *R);
     79   }
     80   C.EmitReport(R);
     81 }
     82 
     83 static StringRef describeUninitializedArgumentInCall(const CallEvent &Call,
     84                                                      bool IsFirstArgument) {
     85   switch (Call.getKind()) {
     86   case CE_ObjCMessage: {
     87     const ObjCMethodCall &Msg = cast<ObjCMethodCall>(Call);
     88     switch (Msg.getMessageKind()) {
     89     case OCM_Message:
     90       return "Argument in message expression is an uninitialized value";
     91     case OCM_PropertyAccess:
     92       assert(Msg.isSetter() && "Getters have no args");
     93       return "Argument for property setter is an uninitialized value";
     94     case OCM_Subscript:
     95       if (Msg.isSetter() && IsFirstArgument)
     96         return "Argument for subscript setter is an uninitialized value";
     97       return "Subscript index is an uninitialized value";
     98     }
     99     llvm_unreachable("Unknown message kind.");
    100   }
    101   case CE_Block:
    102     return "Block call argument is an uninitialized value";
    103   default:
    104     return "Function call argument is an uninitialized value";
    105   }
    106 }
    107 
    108 bool CallAndMessageChecker::PreVisitProcessArg(CheckerContext &C,
    109                                                SVal V, SourceRange argRange,
    110                                                const Expr *argEx,
    111                                                bool IsFirstArgument,
    112                                                bool checkUninitFields,
    113                                                const CallEvent &Call,
    114                                                OwningPtr<BugType> &BT) {
    115   if (V.isUndef()) {
    116     if (ExplodedNode *N = C.generateSink()) {
    117       LazyInit_BT("Uninitialized argument value", BT);
    118 
    119       // Generate a report for this bug.
    120       StringRef Desc = describeUninitializedArgumentInCall(Call,
    121                                                            IsFirstArgument);
    122       BugReport *R = new BugReport(*BT, Desc, N);
    123       R->addRange(argRange);
    124       if (argEx)
    125         bugreporter::trackNullOrUndefValue(N, argEx, *R);
    126       C.EmitReport(R);
    127     }
    128     return true;
    129   }
    130 
    131   if (!checkUninitFields)
    132     return false;
    133 
    134   if (const nonloc::LazyCompoundVal *LV =
    135         dyn_cast<nonloc::LazyCompoundVal>(&V)) {
    136 
    137     class FindUninitializedField {
    138     public:
    139       SmallVector<const FieldDecl *, 10> FieldChain;
    140     private:
    141       StoreManager &StoreMgr;
    142       MemRegionManager &MrMgr;
    143       Store store;
    144     public:
    145       FindUninitializedField(StoreManager &storeMgr,
    146                              MemRegionManager &mrMgr, Store s)
    147       : StoreMgr(storeMgr), MrMgr(mrMgr), store(s) {}
    148 
    149       bool Find(const TypedValueRegion *R) {
    150         QualType T = R->getValueType();
    151         if (const RecordType *RT = T->getAsStructureType()) {
    152           const RecordDecl *RD = RT->getDecl()->getDefinition();
    153           assert(RD && "Referred record has no definition");
    154           for (RecordDecl::field_iterator I =
    155                RD->field_begin(), E = RD->field_end(); I!=E; ++I) {
    156             const FieldRegion *FR = MrMgr.getFieldRegion(*I, R);
    157             FieldChain.push_back(*I);
    158             T = I->getType();
    159             if (T->getAsStructureType()) {
    160               if (Find(FR))
    161                 return true;
    162             }
    163             else {
    164               const SVal &V = StoreMgr.getBinding(store, loc::MemRegionVal(FR));
    165               if (V.isUndef())
    166                 return true;
    167             }
    168             FieldChain.pop_back();
    169           }
    170         }
    171 
    172         return false;
    173       }
    174     };
    175 
    176     const LazyCompoundValData *D = LV->getCVData();
    177     FindUninitializedField F(C.getState()->getStateManager().getStoreManager(),
    178                              C.getSValBuilder().getRegionManager(),
    179                              D->getStore());
    180 
    181     if (F.Find(D->getRegion())) {
    182       if (ExplodedNode *N = C.generateSink()) {
    183         LazyInit_BT("Uninitialized argument value", BT);
    184         SmallString<512> Str;
    185         llvm::raw_svector_ostream os(Str);
    186         os << "Passed-by-value struct argument contains uninitialized data";
    187 
    188         if (F.FieldChain.size() == 1)
    189           os << " (e.g., field: '" << *F.FieldChain[0] << "')";
    190         else {
    191           os << " (e.g., via the field chain: '";
    192           bool first = true;
    193           for (SmallVectorImpl<const FieldDecl *>::iterator
    194                DI = F.FieldChain.begin(), DE = F.FieldChain.end(); DI!=DE;++DI){
    195             if (first)
    196               first = false;
    197             else
    198               os << '.';
    199             os << **DI;
    200           }
    201           os << "')";
    202         }
    203 
    204         // Generate a report for this bug.
    205         BugReport *R = new BugReport(*BT, os.str(), N);
    206         R->addRange(argRange);
    207 
    208         // FIXME: enhance track back for uninitialized value for arbitrary
    209         // memregions
    210         C.EmitReport(R);
    211       }
    212       return true;
    213     }
    214   }
    215 
    216   return false;
    217 }
    218 
    219 void CallAndMessageChecker::checkPreStmt(const CallExpr *CE,
    220                                          CheckerContext &C) const{
    221 
    222   const Expr *Callee = CE->getCallee()->IgnoreParens();
    223   ProgramStateRef State = C.getState();
    224   const LocationContext *LCtx = C.getLocationContext();
    225   SVal L = State->getSVal(Callee, LCtx);
    226 
    227   if (L.isUndef()) {
    228     if (!BT_call_undef)
    229       BT_call_undef.reset(new BuiltinBug("Called function pointer is an "
    230                                          "uninitalized pointer value"));
    231     emitBadCall(BT_call_undef.get(), C, Callee);
    232     return;
    233   }
    234 
    235   ProgramStateRef StNonNull, StNull;
    236   llvm::tie(StNonNull, StNull) = State->assume(cast<DefinedOrUnknownSVal>(L));
    237 
    238   if (StNull && !StNonNull) {
    239     if (!BT_call_null)
    240       BT_call_null.reset(
    241         new BuiltinBug("Called function pointer is null (null dereference)"));
    242     emitBadCall(BT_call_null.get(), C, Callee);
    243   }
    244 
    245   C.addTransition(StNonNull);
    246 }
    247 
    248 void CallAndMessageChecker::checkPreCall(const CallEvent &Call,
    249                                          CheckerContext &C) const {
    250   ProgramStateRef State = C.getState();
    251 
    252   // If this is a call to a C++ method, check if the callee is null or
    253   // undefined.
    254   if (const CXXInstanceCall *CC = dyn_cast<CXXInstanceCall>(&Call)) {
    255     SVal V = CC->getCXXThisVal();
    256     if (V.isUndef()) {
    257       if (!BT_cxx_call_undef)
    258         BT_cxx_call_undef.reset(new BuiltinBug("Called C++ object pointer is "
    259                                                "uninitialized"));
    260       emitBadCall(BT_cxx_call_undef.get(), C, CC->getCXXThisExpr());
    261       return;
    262     }
    263 
    264     ProgramStateRef StNonNull, StNull;
    265     llvm::tie(StNonNull, StNull) = State->assume(cast<DefinedOrUnknownSVal>(V));
    266 
    267     if (StNull && !StNonNull) {
    268       if (!BT_cxx_call_null)
    269         BT_cxx_call_null.reset(new BuiltinBug("Called C++ object pointer "
    270                                               "is null"));
    271       emitBadCall(BT_cxx_call_null.get(), C, CC->getCXXThisExpr());
    272       return;
    273     }
    274 
    275     State = StNonNull;
    276   }
    277 
    278   // Don't check for uninitialized field values in arguments if the
    279   // caller has a body that is available and we have the chance to inline it.
    280   // This is a hack, but is a reasonable compromise betweens sometimes warning
    281   // and sometimes not depending on if we decide to inline a function.
    282   const Decl *D = Call.getDecl();
    283   const bool checkUninitFields =
    284     !(C.getAnalysisManager().shouldInlineCall() && (D && D->getBody()));
    285 
    286   OwningPtr<BugType> *BT;
    287   if (isa<ObjCMethodCall>(Call))
    288     BT = &BT_msg_arg;
    289   else
    290     BT = &BT_call_arg;
    291 
    292   for (unsigned i = 0, e = Call.getNumArgs(); i != e; ++i)
    293     if (PreVisitProcessArg(C, Call.getArgSVal(i), Call.getArgSourceRange(i),
    294                            Call.getArgExpr(i), /*IsFirstArgument=*/i == 0,
    295                            checkUninitFields, Call, *BT))
    296       return;
    297 
    298   // If we make it here, record our assumptions about the callee.
    299   C.addTransition(State);
    300 }
    301 
    302 void CallAndMessageChecker::checkPreObjCMessage(const ObjCMethodCall &msg,
    303                                                 CheckerContext &C) const {
    304   SVal recVal = msg.getReceiverSVal();
    305   if (recVal.isUndef()) {
    306     if (ExplodedNode *N = C.generateSink()) {
    307       BugType *BT = 0;
    308       switch (msg.getMessageKind()) {
    309       case OCM_Message:
    310         if (!BT_msg_undef)
    311           BT_msg_undef.reset(new BuiltinBug("Receiver in message expression "
    312                                             "is an uninitialized value"));
    313         BT = BT_msg_undef.get();
    314         break;
    315       case OCM_PropertyAccess:
    316         if (!BT_objc_prop_undef)
    317           BT_objc_prop_undef.reset(new BuiltinBug("Property access on an "
    318                                                   "uninitialized object "
    319                                                   "pointer"));
    320         BT = BT_objc_prop_undef.get();
    321         break;
    322       case OCM_Subscript:
    323         if (!BT_objc_subscript_undef)
    324           BT_objc_subscript_undef.reset(new BuiltinBug("Subscript access on an "
    325                                                        "uninitialized object "
    326                                                        "pointer"));
    327         BT = BT_objc_subscript_undef.get();
    328         break;
    329       }
    330       assert(BT && "Unknown message kind.");
    331 
    332       BugReport *R = new BugReport(*BT, BT->getName(), N);
    333       const ObjCMessageExpr *ME = msg.getOriginExpr();
    334       R->addRange(ME->getReceiverRange());
    335 
    336       // FIXME: getTrackNullOrUndefValueVisitor can't handle "super" yet.
    337       if (const Expr *ReceiverE = ME->getInstanceReceiver())
    338         bugreporter::trackNullOrUndefValue(N, ReceiverE, *R);
    339       C.EmitReport(R);
    340     }
    341     return;
    342   } else {
    343     // Bifurcate the state into nil and non-nil ones.
    344     DefinedOrUnknownSVal receiverVal = cast<DefinedOrUnknownSVal>(recVal);
    345 
    346     ProgramStateRef state = C.getState();
    347     ProgramStateRef notNilState, nilState;
    348     llvm::tie(notNilState, nilState) = state->assume(receiverVal);
    349 
    350     // Handle receiver must be nil.
    351     if (nilState && !notNilState) {
    352       HandleNilReceiver(C, state, msg);
    353       return;
    354     }
    355   }
    356 }
    357 
    358 void CallAndMessageChecker::emitNilReceiverBug(CheckerContext &C,
    359                                                const ObjCMethodCall &msg,
    360                                                ExplodedNode *N) const {
    361 
    362   if (!BT_msg_ret)
    363     BT_msg_ret.reset(
    364       new BuiltinBug("Receiver in message expression is "
    365                      "'nil' and returns a garbage value"));
    366 
    367   const ObjCMessageExpr *ME = msg.getOriginExpr();
    368 
    369   SmallString<200> buf;
    370   llvm::raw_svector_ostream os(buf);
    371   os << "The receiver of message '" << ME->getSelector().getAsString()
    372      << "' is nil and returns a value of type '";
    373   msg.getResultType().print(os, C.getLangOpts());
    374   os << "' that will be garbage";
    375 
    376   BugReport *report = new BugReport(*BT_msg_ret, os.str(), N);
    377   report->addRange(ME->getReceiverRange());
    378   // FIXME: This won't track "self" in messages to super.
    379   if (const Expr *receiver = ME->getInstanceReceiver()) {
    380     bugreporter::trackNullOrUndefValue(N, receiver, *report);
    381   }
    382   C.EmitReport(report);
    383 }
    384 
    385 static bool supportsNilWithFloatRet(const llvm::Triple &triple) {
    386   return (triple.getVendor() == llvm::Triple::Apple &&
    387           (triple.getOS() == llvm::Triple::IOS ||
    388            !triple.isMacOSXVersionLT(10,5)));
    389 }
    390 
    391 void CallAndMessageChecker::HandleNilReceiver(CheckerContext &C,
    392                                               ProgramStateRef state,
    393                                               const ObjCMethodCall &Msg) const {
    394   ASTContext &Ctx = C.getASTContext();
    395 
    396   // Check the return type of the message expression.  A message to nil will
    397   // return different values depending on the return type and the architecture.
    398   QualType RetTy = Msg.getResultType();
    399   CanQualType CanRetTy = Ctx.getCanonicalType(RetTy);
    400   const LocationContext *LCtx = C.getLocationContext();
    401 
    402   if (CanRetTy->isStructureOrClassType()) {
    403     // Structure returns are safe since the compiler zeroes them out.
    404     SVal V = C.getSValBuilder().makeZeroVal(RetTy);
    405     C.addTransition(state->BindExpr(Msg.getOriginExpr(), LCtx, V));
    406     return;
    407   }
    408 
    409   // Other cases: check if sizeof(return type) > sizeof(void*)
    410   if (CanRetTy != Ctx.VoidTy && C.getLocationContext()->getParentMap()
    411                                   .isConsumedExpr(Msg.getOriginExpr())) {
    412     // Compute: sizeof(void *) and sizeof(return type)
    413     const uint64_t voidPtrSize = Ctx.getTypeSize(Ctx.VoidPtrTy);
    414     const uint64_t returnTypeSize = Ctx.getTypeSize(CanRetTy);
    415 
    416     if (voidPtrSize < returnTypeSize &&
    417         !(supportsNilWithFloatRet(Ctx.getTargetInfo().getTriple()) &&
    418           (Ctx.FloatTy == CanRetTy ||
    419            Ctx.DoubleTy == CanRetTy ||
    420            Ctx.LongDoubleTy == CanRetTy ||
    421            Ctx.LongLongTy == CanRetTy ||
    422            Ctx.UnsignedLongLongTy == CanRetTy))) {
    423       if (ExplodedNode *N = C.generateSink(state))
    424         emitNilReceiverBug(C, Msg, N);
    425       return;
    426     }
    427 
    428     // Handle the safe cases where the return value is 0 if the
    429     // receiver is nil.
    430     //
    431     // FIXME: For now take the conservative approach that we only
    432     // return null values if we *know* that the receiver is nil.
    433     // This is because we can have surprises like:
    434     //
    435     //   ... = [[NSScreens screens] objectAtIndex:0];
    436     //
    437     // What can happen is that [... screens] could return nil, but
    438     // it most likely isn't nil.  We should assume the semantics
    439     // of this case unless we have *a lot* more knowledge.
    440     //
    441     SVal V = C.getSValBuilder().makeZeroVal(RetTy);
    442     C.addTransition(state->BindExpr(Msg.getOriginExpr(), LCtx, V));
    443     return;
    444   }
    445 
    446   C.addTransition(state);
    447 }
    448 
    449 void ento::registerCallAndMessageChecker(CheckerManager &mgr) {
    450   mgr.registerChecker<CallAndMessageChecker>();
    451 }
    452