Home | History | Annotate | Download | only in Expression
      1 //===-- IRDynamicChecks.cpp -------------------------------------------*- C++ -*-===//
      2 //
      3 //                     The LLVM Compiler Infrastructure
      4 //
      5 // This file is distributed under the University of Illinois Open Source
      6 // License. See LICENSE.TXT for details.
      7 //
      8 //===----------------------------------------------------------------------===//
      9 
     10 #include "lldb/Expression/IRDynamicChecks.h"
     11 
     12 #include "lldb/Core/ConstString.h"
     13 #include "lldb/Core/Log.h"
     14 #include "lldb/Expression/ClangUtilityFunction.h"
     15 #include "lldb/Target/ExecutionContext.h"
     16 #include "lldb/Target/ObjCLanguageRuntime.h"
     17 #include "lldb/Target/Process.h"
     18 #include "lldb/Target/StackFrame.h"
     19 
     20 #include "llvm/Support/raw_ostream.h"
     21 #include "llvm/IR/Constants.h"
     22 #include "llvm/IR/Function.h"
     23 #include "llvm/IR/Instructions.h"
     24 #include "llvm/IR/Module.h"
     25 #include "llvm/IR/Value.h"
     26 
     27 using namespace llvm;
     28 using namespace lldb_private;
     29 
     30 static char ID;
     31 
     32 #define VALID_POINTER_CHECK_NAME "$__lldb_valid_pointer_check"
     33 #define VALID_OBJC_OBJECT_CHECK_NAME "$__lldb_objc_object_check"
     34 
     35 static const char g_valid_pointer_check_text[] =
     36 "extern \"C\" void\n"
     37 "$__lldb_valid_pointer_check (unsigned char *$__lldb_arg_ptr)\n"
     38 "{\n"
     39 "    unsigned char $__lldb_local_val = *$__lldb_arg_ptr;\n"
     40 "}";
     41 
     42 DynamicCheckerFunctions::DynamicCheckerFunctions ()
     43 {
     44 }
     45 
     46 DynamicCheckerFunctions::~DynamicCheckerFunctions ()
     47 {
     48 }
     49 
     50 bool
     51 DynamicCheckerFunctions::Install(Stream &error_stream,
     52                                  ExecutionContext &exe_ctx)
     53 {
     54     m_valid_pointer_check.reset(new ClangUtilityFunction(g_valid_pointer_check_text,
     55                                                          VALID_POINTER_CHECK_NAME));
     56     if (!m_valid_pointer_check->Install(error_stream, exe_ctx))
     57         return false;
     58 
     59     Process *process = exe_ctx.GetProcessPtr();
     60 
     61     if (process)
     62     {
     63         ObjCLanguageRuntime *objc_language_runtime = process->GetObjCLanguageRuntime();
     64 
     65         if (objc_language_runtime)
     66         {
     67             m_objc_object_check.reset(objc_language_runtime->CreateObjectChecker(VALID_OBJC_OBJECT_CHECK_NAME));
     68 
     69             if (!m_objc_object_check->Install(error_stream, exe_ctx))
     70                 return false;
     71         }
     72     }
     73 
     74     return true;
     75 }
     76 
     77 bool
     78 DynamicCheckerFunctions::DoCheckersExplainStop (lldb::addr_t addr, Stream &message)
     79 {
     80     // FIXME: We have to get the checkers to know why they scotched the call in more detail,
     81     // so we can print a better message here.
     82     if (m_valid_pointer_check.get() != NULL && m_valid_pointer_check->ContainsAddress(addr))
     83     {
     84         message.Printf ("Attempted to dereference an invalid pointer.");
     85         return true;
     86     }
     87     else if (m_objc_object_check.get() != NULL && m_objc_object_check->ContainsAddress(addr))
     88     {
     89         message.Printf ("Attempted to dereference an invalid ObjC Object or send it an unrecognized selector");
     90         return true;
     91     }
     92     return false;
     93 }
     94 
     95 
     96 static std::string
     97 PrintValue(llvm::Value *V, bool truncate = false)
     98 {
     99     std::string s;
    100     raw_string_ostream rso(s);
    101     V->print(rso);
    102     rso.flush();
    103     if (truncate)
    104         s.resize(s.length() - 1);
    105     return s;
    106 }
    107 
    108 //----------------------------------------------------------------------
    109 /// @class Instrumenter IRDynamicChecks.cpp
    110 /// @brief Finds and instruments individual LLVM IR instructions
    111 ///
    112 /// When instrumenting LLVM IR, it is frequently desirable to first search
    113 /// for instructions, and then later modify them.  This way iterators
    114 /// remain intact, and multiple passes can look at the same code base without
    115 /// treading on each other's toes.
    116 ///
    117 /// The Instrumenter class implements this functionality.  A client first
    118 /// calls Inspect on a function, which populates a list of instructions to
    119 /// be instrumented.  Then, later, when all passes' Inspect functions have
    120 /// been called, the client calls Instrument, which adds the desired
    121 /// instrumentation.
    122 ///
    123 /// A subclass of Instrumenter must override InstrumentInstruction, which
    124 /// is responsible for adding whatever instrumentation is necessary.
    125 ///
    126 /// A subclass of Instrumenter may override:
    127 ///
    128 /// - InspectInstruction [default: does nothing]
    129 ///
    130 /// - InspectBasicBlock [default: iterates through the instructions in a
    131 ///   basic block calling InspectInstruction]
    132 ///
    133 /// - InspectFunction [default: iterates through the basic blocks in a
    134 ///   function calling InspectBasicBlock]
    135 //----------------------------------------------------------------------
    136 class Instrumenter {
    137 public:
    138     //------------------------------------------------------------------
    139     /// Constructor
    140     ///
    141     /// @param[in] module
    142     ///     The module being instrumented.
    143     //------------------------------------------------------------------
    144     Instrumenter (llvm::Module &module,
    145                   DynamicCheckerFunctions &checker_functions) :
    146         m_module(module),
    147         m_checker_functions(checker_functions),
    148         m_i8ptr_ty(NULL)
    149     {
    150     }
    151 
    152     virtual~Instrumenter ()
    153     {
    154     }
    155 
    156     //------------------------------------------------------------------
    157     /// Inspect a function to find instructions to instrument
    158     ///
    159     /// @param[in] function
    160     ///     The function to inspect.
    161     ///
    162     /// @return
    163     ///     True on success; false on error.
    164     //------------------------------------------------------------------
    165     bool Inspect (llvm::Function &function)
    166     {
    167         return InspectFunction(function);
    168     }
    169 
    170     //------------------------------------------------------------------
    171     /// Instrument all the instructions found by Inspect()
    172     ///
    173     /// @return
    174     ///     True on success; false on error.
    175     //------------------------------------------------------------------
    176     bool Instrument ()
    177     {
    178         for (InstIterator ii = m_to_instrument.begin(), last_ii = m_to_instrument.end();
    179              ii != last_ii;
    180              ++ii)
    181         {
    182             if (!InstrumentInstruction(*ii))
    183                 return false;
    184         }
    185 
    186         return true;
    187     }
    188 protected:
    189     //------------------------------------------------------------------
    190     /// Add instrumentation to a single instruction
    191     ///
    192     /// @param[in] inst
    193     ///     The instruction to be instrumented.
    194     ///
    195     /// @return
    196     ///     True on success; false otherwise.
    197     //------------------------------------------------------------------
    198     virtual bool InstrumentInstruction(llvm::Instruction *inst) = 0;
    199 
    200     //------------------------------------------------------------------
    201     /// Register a single instruction to be instrumented
    202     ///
    203     /// @param[in] inst
    204     ///     The instruction to be instrumented.
    205     //------------------------------------------------------------------
    206     void RegisterInstruction(llvm::Instruction &i)
    207     {
    208         m_to_instrument.push_back(&i);
    209     }
    210 
    211     //------------------------------------------------------------------
    212     /// Determine whether a single instruction is interesting to
    213     /// instrument, and, if so, call RegisterInstruction
    214     ///
    215     /// @param[in] i
    216     ///     The instruction to be inspected.
    217     ///
    218     /// @return
    219     ///     False if there was an error scanning; true otherwise.
    220     //------------------------------------------------------------------
    221     virtual bool InspectInstruction(llvm::Instruction &i)
    222     {
    223         return true;
    224     }
    225 
    226     //------------------------------------------------------------------
    227     /// Scan a basic block to see if any instructions are interesting
    228     ///
    229     /// @param[in] bb
    230     ///     The basic block to be inspected.
    231     ///
    232     /// @return
    233     ///     False if there was an error scanning; true otherwise.
    234     //------------------------------------------------------------------
    235     virtual bool InspectBasicBlock(llvm::BasicBlock &bb)
    236     {
    237         for (llvm::BasicBlock::iterator ii = bb.begin(), last_ii = bb.end();
    238              ii != last_ii;
    239              ++ii)
    240         {
    241             if (!InspectInstruction(*ii))
    242                 return false;
    243         }
    244 
    245         return true;
    246     }
    247 
    248     //------------------------------------------------------------------
    249     /// Scan a function to see if any instructions are interesting
    250     ///
    251     /// @param[in] f
    252     ///     The function to be inspected.
    253     ///
    254     /// @return
    255     ///     False if there was an error scanning; true otherwise.
    256     //------------------------------------------------------------------
    257     virtual bool InspectFunction(llvm::Function &f)
    258     {
    259         for (llvm::Function::iterator bbi = f.begin(), last_bbi = f.end();
    260              bbi != last_bbi;
    261              ++bbi)
    262         {
    263             if (!InspectBasicBlock(*bbi))
    264                 return false;
    265         }
    266 
    267         return true;
    268     }
    269 
    270     //------------------------------------------------------------------
    271     /// Build a function pointer for a function with signature
    272     /// void (*)(uint8_t*) with a given address
    273     ///
    274     /// @param[in] start_address
    275     ///     The address of the function.
    276     ///
    277     /// @return
    278     ///     The function pointer, for use in a CallInst.
    279     //------------------------------------------------------------------
    280     llvm::Value *BuildPointerValidatorFunc(lldb::addr_t start_address)
    281     {
    282         IntegerType *intptr_ty = llvm::Type::getIntNTy(m_module.getContext(),
    283                                                              (m_module.getPointerSize() == llvm::Module::Pointer64) ? 64 : 32);
    284 
    285         llvm::Type *param_array[1];
    286 
    287         param_array[0] = const_cast<llvm::PointerType*>(GetI8PtrTy());
    288 
    289         ArrayRef<llvm::Type*> params(param_array, 1);
    290 
    291         FunctionType *fun_ty = FunctionType::get(llvm::Type::getVoidTy(m_module.getContext()), params, true);
    292         PointerType *fun_ptr_ty = PointerType::getUnqual(fun_ty);
    293         Constant *fun_addr_int = ConstantInt::get(intptr_ty, start_address, false);
    294         return ConstantExpr::getIntToPtr(fun_addr_int, fun_ptr_ty);
    295     }
    296 
    297     //------------------------------------------------------------------
    298     /// Build a function pointer for a function with signature
    299     /// void (*)(uint8_t*, uint8_t*) with a given address
    300     ///
    301     /// @param[in] start_address
    302     ///     The address of the function.
    303     ///
    304     /// @return
    305     ///     The function pointer, for use in a CallInst.
    306     //------------------------------------------------------------------
    307     llvm::Value *BuildObjectCheckerFunc(lldb::addr_t start_address)
    308     {
    309         IntegerType *intptr_ty = llvm::Type::getIntNTy(m_module.getContext(),
    310                                                        (m_module.getPointerSize() == llvm::Module::Pointer64) ? 64 : 32);
    311 
    312         llvm::Type *param_array[2];
    313 
    314         param_array[0] = const_cast<llvm::PointerType*>(GetI8PtrTy());
    315         param_array[1] = const_cast<llvm::PointerType*>(GetI8PtrTy());
    316 
    317         ArrayRef<llvm::Type*> params(param_array, 2);
    318 
    319         FunctionType *fun_ty = FunctionType::get(llvm::Type::getVoidTy(m_module.getContext()), params, true);
    320         PointerType *fun_ptr_ty = PointerType::getUnqual(fun_ty);
    321         Constant *fun_addr_int = ConstantInt::get(intptr_ty, start_address, false);
    322         return ConstantExpr::getIntToPtr(fun_addr_int, fun_ptr_ty);
    323     }
    324 
    325     PointerType *GetI8PtrTy()
    326     {
    327         if (!m_i8ptr_ty)
    328             m_i8ptr_ty = llvm::Type::getInt8PtrTy(m_module.getContext());
    329 
    330         return m_i8ptr_ty;
    331     }
    332 
    333     typedef std::vector <llvm::Instruction *>   InstVector;
    334     typedef InstVector::iterator                InstIterator;
    335 
    336     InstVector                  m_to_instrument;        ///< List of instructions the inspector found
    337     llvm::Module               &m_module;               ///< The module which is being instrumented
    338     DynamicCheckerFunctions    &m_checker_functions;    ///< The dynamic checker functions for the process
    339 private:
    340     PointerType                *m_i8ptr_ty;
    341 };
    342 
    343 class ValidPointerChecker : public Instrumenter
    344 {
    345 public:
    346     ValidPointerChecker (llvm::Module &module,
    347                          DynamicCheckerFunctions &checker_functions) :
    348         Instrumenter(module, checker_functions),
    349         m_valid_pointer_check_func(NULL)
    350     {
    351     }
    352 
    353     virtual ~ValidPointerChecker ()
    354     {
    355     }
    356 private:
    357     bool InstrumentInstruction(llvm::Instruction *inst)
    358     {
    359         Log *log(lldb_private::GetLogIfAllCategoriesSet (LIBLLDB_LOG_EXPRESSIONS));
    360 
    361         if (log)
    362             log->Printf("Instrumenting load/store instruction: %s\n",
    363                         PrintValue(inst).c_str());
    364 
    365         if (!m_valid_pointer_check_func)
    366             m_valid_pointer_check_func = BuildPointerValidatorFunc(m_checker_functions.m_valid_pointer_check->StartAddress());
    367 
    368         llvm::Value *dereferenced_ptr = NULL;
    369 
    370         if (llvm::LoadInst *li = dyn_cast<llvm::LoadInst> (inst))
    371             dereferenced_ptr = li->getPointerOperand();
    372         else if (llvm::StoreInst *si = dyn_cast<llvm::StoreInst> (inst))
    373             dereferenced_ptr = si->getPointerOperand();
    374         else
    375             return false;
    376 
    377         // Insert an instruction to cast the loaded value to int8_t*
    378 
    379         BitCastInst *bit_cast = new BitCastInst(dereferenced_ptr,
    380                                                 GetI8PtrTy(),
    381                                                 "",
    382                                                 inst);
    383 
    384         // Insert an instruction to call the helper with the result
    385 
    386         llvm::Value *arg_array[1];
    387 
    388         arg_array[0] = bit_cast;
    389 
    390         llvm::ArrayRef<llvm::Value *> args(arg_array, 1);
    391 
    392         CallInst::Create(m_valid_pointer_check_func,
    393                          args,
    394                          "",
    395                          inst);
    396 
    397         return true;
    398     }
    399 
    400     bool InspectInstruction(llvm::Instruction &i)
    401     {
    402         if (dyn_cast<llvm::LoadInst> (&i) ||
    403             dyn_cast<llvm::StoreInst> (&i))
    404             RegisterInstruction(i);
    405 
    406         return true;
    407     }
    408 
    409     llvm::Value         *m_valid_pointer_check_func;
    410 };
    411 
    412 class ObjcObjectChecker : public Instrumenter
    413 {
    414 public:
    415     ObjcObjectChecker(llvm::Module &module,
    416                         DynamicCheckerFunctions &checker_functions) :
    417         Instrumenter(module, checker_functions),
    418         m_objc_object_check_func(NULL)
    419     {
    420     }
    421 
    422     virtual
    423     ~ObjcObjectChecker ()
    424     {
    425     }
    426 
    427     enum msgSend_type
    428     {
    429         eMsgSend = 0,
    430         eMsgSendSuper,
    431         eMsgSendSuper_stret,
    432         eMsgSend_fpret,
    433         eMsgSend_stret
    434     };
    435 
    436     std::map <llvm::Instruction *, msgSend_type> msgSend_types;
    437 
    438 private:
    439     bool InstrumentInstruction(llvm::Instruction *inst)
    440     {
    441         CallInst *call_inst = dyn_cast<CallInst>(inst);
    442 
    443         if (!call_inst)
    444             return false; // call_inst really shouldn't be NULL, because otherwise InspectInstruction wouldn't have registered it
    445 
    446         if (!m_objc_object_check_func)
    447             m_objc_object_check_func = BuildObjectCheckerFunc(m_checker_functions.m_objc_object_check->StartAddress());
    448 
    449         // id objc_msgSend(id theReceiver, SEL theSelector, ...)
    450 
    451         llvm::Value *target_object;
    452         llvm::Value *selector;
    453 
    454         switch (msgSend_types[inst])
    455         {
    456         case eMsgSend:
    457         case eMsgSend_fpret:
    458             target_object = call_inst->getArgOperand(0);
    459             selector = call_inst->getArgOperand(1);
    460             break;
    461         case eMsgSend_stret:
    462             target_object = call_inst->getArgOperand(1);
    463             selector = call_inst->getArgOperand(2);
    464             break;
    465         case eMsgSendSuper:
    466         case eMsgSendSuper_stret:
    467             return true;
    468         }
    469 
    470         // These objects should always be valid according to Sean Calannan
    471         assert (target_object);
    472         assert (selector);
    473 
    474         // Insert an instruction to cast the receiver id to int8_t*
    475 
    476         BitCastInst *bit_cast = new BitCastInst(target_object,
    477                                                 GetI8PtrTy(),
    478                                                 "",
    479                                                 inst);
    480 
    481         // Insert an instruction to call the helper with the result
    482 
    483         llvm::Value *arg_array[2];
    484 
    485         arg_array[0] = bit_cast;
    486         arg_array[1] = selector;
    487 
    488         ArrayRef<llvm::Value*> args(arg_array, 2);
    489 
    490         CallInst::Create(m_objc_object_check_func,
    491                          args,
    492                          "",
    493                          inst);
    494 
    495         return true;
    496     }
    497 
    498     bool InspectInstruction(llvm::Instruction &i)
    499     {
    500         Log *log(lldb_private::GetLogIfAllCategoriesSet (LIBLLDB_LOG_EXPRESSIONS));
    501 
    502         CallInst *call_inst = dyn_cast<CallInst>(&i);
    503 
    504         if (call_inst)
    505         {
    506             // This metadata is set by IRForTarget::MaybeHandleCall().
    507 
    508             MDNode *metadata = call_inst->getMetadata("lldb.call.realName");
    509 
    510             if (!metadata)
    511                 return true;
    512 
    513             if (metadata->getNumOperands() != 1)
    514             {
    515                 if (log)
    516                     log->Printf("Function call metadata has %d operands for [%p] %s", metadata->getNumOperands(), call_inst, PrintValue(call_inst).c_str());
    517                 return false;
    518             }
    519 
    520             MDString *real_name = dyn_cast<MDString>(metadata->getOperand(0));
    521 
    522             if (!real_name)
    523             {
    524                 if (log)
    525                     log->Printf("Function call metadata is not an MDString for [%p] %s", call_inst, PrintValue(call_inst).c_str());
    526                 return false;
    527             }
    528 
    529             std::string name_str = real_name->getString();
    530             const char* name_cstr = name_str.c_str();
    531 
    532             if (log)
    533                 log->Printf("Found call to %s: %s\n", name_cstr, PrintValue(call_inst).c_str());
    534 
    535             if (name_str.find("objc_msgSend") == std::string::npos)
    536                 return true;
    537 
    538             if (!strcmp(name_cstr, "objc_msgSend"))
    539             {
    540                 RegisterInstruction(i);
    541                 msgSend_types[&i] = eMsgSend;
    542                 return true;
    543             }
    544 
    545             if (!strcmp(name_cstr, "objc_msgSend_stret"))
    546             {
    547                 RegisterInstruction(i);
    548                 msgSend_types[&i] = eMsgSend_stret;
    549                 return true;
    550             }
    551 
    552             if (!strcmp(name_cstr, "objc_msgSend_fpret"))
    553             {
    554                 RegisterInstruction(i);
    555                 msgSend_types[&i] = eMsgSend_fpret;
    556                 return true;
    557             }
    558 
    559             if (!strcmp(name_cstr, "objc_msgSendSuper"))
    560             {
    561                 RegisterInstruction(i);
    562                 msgSend_types[&i] = eMsgSendSuper;
    563                 return true;
    564             }
    565 
    566             if (!strcmp(name_cstr, "objc_msgSendSuper_stret"))
    567             {
    568                 RegisterInstruction(i);
    569                 msgSend_types[&i] = eMsgSendSuper_stret;
    570                 return true;
    571             }
    572 
    573             if (log)
    574                 log->Printf("Function name '%s' contains 'objc_msgSend' but is not handled", name_str.c_str());
    575 
    576             return true;
    577         }
    578 
    579         return true;
    580     }
    581 
    582     llvm::Value         *m_objc_object_check_func;
    583 };
    584 
    585 IRDynamicChecks::IRDynamicChecks(DynamicCheckerFunctions &checker_functions,
    586                                  const char *func_name) :
    587     ModulePass(ID),
    588     m_func_name(func_name),
    589     m_checker_functions(checker_functions)
    590 {
    591 }
    592 
    593 IRDynamicChecks::~IRDynamicChecks()
    594 {
    595 }
    596 
    597 bool
    598 IRDynamicChecks::runOnModule(llvm::Module &M)
    599 {
    600     Log *log(lldb_private::GetLogIfAllCategoriesSet (LIBLLDB_LOG_EXPRESSIONS));
    601 
    602     llvm::Function* function = M.getFunction(StringRef(m_func_name.c_str()));
    603 
    604     if (!function)
    605     {
    606         if (log)
    607             log->Printf("Couldn't find %s() in the module", m_func_name.c_str());
    608 
    609         return false;
    610     }
    611 
    612     if (m_checker_functions.m_valid_pointer_check.get())
    613     {
    614         ValidPointerChecker vpc(M, m_checker_functions);
    615 
    616         if (!vpc.Inspect(*function))
    617             return false;
    618 
    619         if (!vpc.Instrument())
    620             return false;
    621     }
    622 
    623     if (m_checker_functions.m_objc_object_check.get())
    624     {
    625         ObjcObjectChecker ooc(M, m_checker_functions);
    626 
    627         if (!ooc.Inspect(*function))
    628             return false;
    629 
    630         if (!ooc.Instrument())
    631             return false;
    632     }
    633 
    634     if (log && log->GetVerbose())
    635     {
    636         std::string s;
    637         raw_string_ostream oss(s);
    638 
    639         M.print(oss, NULL);
    640 
    641         oss.flush();
    642 
    643         log->Printf ("Module after dynamic checks: \n%s", s.c_str());
    644     }
    645 
    646     return true;
    647 }
    648 
    649 void
    650 IRDynamicChecks::assignPassManager(PMStack &PMS,
    651                                    PassManagerType T)
    652 {
    653 }
    654 
    655 PassManagerType
    656 IRDynamicChecks::getPotentialPassManagerType() const
    657 {
    658     return PMT_ModulePassManager;
    659 }
    660