Home | History | Annotate | Download | only in msan
      1 //===-- msan.cc -----------------------------------------------------------===//
      2 //
      3 //                     The LLVM Compiler Infrastructure
      4 //
      5 // This file is distributed under the University of Illinois Open Source
      6 // License. See LICENSE.TXT for details.
      7 //
      8 //===----------------------------------------------------------------------===//
      9 //
     10 // This file is a part of MemorySanitizer.
     11 //
     12 // MemorySanitizer runtime.
     13 //===----------------------------------------------------------------------===//
     14 
     15 #include "msan.h"
     16 #include "sanitizer_common/sanitizer_atomic.h"
     17 #include "sanitizer_common/sanitizer_common.h"
     18 #include "sanitizer_common/sanitizer_flags.h"
     19 #include "sanitizer_common/sanitizer_libc.h"
     20 #include "sanitizer_common/sanitizer_procmaps.h"
     21 #include "sanitizer_common/sanitizer_stacktrace.h"
     22 #include "sanitizer_common/sanitizer_symbolizer.h"
     23 
     24 #include "interception/interception.h"
     25 
     26 // ACHTUNG! No system header includes in this file.
     27 
     28 using namespace __sanitizer;
     29 
// Globals.
// Non-zero while a UMR (uninitialized memory read) report is expected on this
// thread; set by __msan_set_expect_umr() and tested in
// PrintWarningWithOrigin().
static THREADLOCAL int msan_expect_umr = 0;
// Set to 1 by PrintWarningWithOrigin() when a report arrived while
// msan_expect_umr was set; reset to 0 by __msan_set_expect_umr(non-zero).
static THREADLOCAL int msan_expected_umr_found = 0;

// Result of IsRunningUnderDr(), stored by __msan_init() and returned by
// __msan_has_dynamic_component().
static int msan_running_under_dr = 0;
     35 
// Thread-local buffers exported through SANITIZER_INTERFACE_ATTRIBUTE.
// NOTE(review): presumably the instrumented code accesses these directly;
// confirm against the compiler pass. Only the uses noted below are visible
// in this file.

// Zeroed (first n words) by UnpoisonParam(); word 0 is cleared by
// __msan_clear_on_return(); word 1 is read by the unaligned store helpers.
SANITIZER_INTERFACE_ATTRIBUTE
THREADLOCAL u64 __msan_param_tls[kMsanParamTlsSizeInWords];

SANITIZER_INTERFACE_ATTRIBUTE
THREADLOCAL u32 __msan_param_origin_tls[kMsanParamTlsSizeInWords];

// Word 0 is written by the unaligned load helpers.
SANITIZER_INTERFACE_ATTRIBUTE
THREADLOCAL u64 __msan_retval_tls[kMsanRetvalTlsSizeInWords];

SANITIZER_INTERFACE_ATTRIBUTE
THREADLOCAL u32 __msan_retval_origin_tls;

SANITIZER_INTERFACE_ATTRIBUTE
THREADLOCAL u64 __msan_va_arg_tls[kMsanParamTlsSizeInWords];

SANITIZER_INTERFACE_ATTRIBUTE
THREADLOCAL u64 __msan_va_arg_overflow_size_tls;

// Origin id used by PrintWarning() and returned by __msan_get_umr_origin().
SANITIZER_INTERFACE_ATTRIBUTE
THREADLOCAL u32 __msan_origin_tls;
     56 
// Per-thread cache of the stack limits. It is filled by
// GetCurrentStackBounds() on first use and by __msan_init();
// stack_top == 0 means "not computed yet".
static THREADLOCAL struct {
  uptr stack_top, stack_bottom;
} __msan_stack_bounds;

// Toggled by EnterSymbolizer()/ExitSymbolizer().
static THREADLOCAL bool is_in_symbolizer;
// Toggled by EnterLoader()/ExitLoader(); exposed via __msan_is_in_loader().
static THREADLOCAL bool is_in_loader;
     63 
     64 extern "C" SANITIZER_WEAK_ATTRIBUTE const int __msan_track_origins;
     65 
     66 int __msan_get_track_origins() {
     67   return &__msan_track_origins ? __msan_track_origins : 0;
     68 }
     69 
     70 extern "C" SANITIZER_WEAK_ATTRIBUTE const int __msan_keep_going;
     71 
     72 namespace __msan {
     73 
     74 static bool IsRunningUnderDr() {
     75   bool result = false;
     76   MemoryMappingLayout proc_maps(/*cache_enabled*/true);
     77   const sptr kBufSize = 4095;
     78   char *filename = (char*)MmapOrDie(kBufSize, __FUNCTION__);
     79   while (proc_maps.Next(/* start */0, /* end */0, /* file_offset */0,
     80                         filename, kBufSize, /* protection */0)) {
     81     if (internal_strstr(filename, "libdynamorio") != 0) {
     82       result = true;
     83       break;
     84     }
     85   }
     86   UnmapOrDie(filename, kBufSize);
     87   return result;
     88 }
     89 
     90 void EnterSymbolizer() { is_in_symbolizer = true; }
     91 void ExitSymbolizer()  { is_in_symbolizer = false; }
     92 bool IsInSymbolizer() { return is_in_symbolizer; }
     93 
     94 void EnterLoader() { is_in_loader = true; }
     95 void ExitLoader()  { is_in_loader = false; }
     96 
     97 extern "C" {
     98 SANITIZER_INTERFACE_ATTRIBUTE
     99 bool __msan_is_in_loader() { return is_in_loader; }
    100 }
    101 
    102 static Flags msan_flags;
    103 
    104 Flags *flags() {
    105   return &msan_flags;
    106 }
    107 
// Set to 1 at the end of __msan_init(); a non-zero value makes later calls to
// __msan_init() return immediately.
int msan_inited = 0;
// True between the start and the end of __msan_init().
bool msan_init_is_running;

// Incremented by PrintWarningWithOrigin() for every report it emits.
int msan_report_count = 0;

// Array of stack origins.
// FIXME: make it resizable.
static const uptr kNumStackOriginDescrs = 1024 * 1024;
// Indexed by the id handed out in __msan_set_alloca_origin().
static const char *StackOriginDescr[kNumStackOriginDescrs];
// Next free id; advanced atomically in __msan_set_alloca_origin().
static atomic_uint32_t NumStackOriginDescrs;
    118 
    119 static void ParseFlagsFromString(Flags *f, const char *str) {
    120   ParseCommonFlagsFromString(str);
    121   ParseFlag(str, &f->poison_heap_with_zeroes, "poison_heap_with_zeroes");
    122   ParseFlag(str, &f->poison_stack_with_zeroes, "poison_stack_with_zeroes");
    123   ParseFlag(str, &f->poison_in_malloc, "poison_in_malloc");
    124   ParseFlag(str, &f->exit_code, "exit_code");
    125   if (f->exit_code < 0 || f->exit_code > 127) {
    126     Printf("Exit code not in [0, 128) range: %d\n", f->exit_code);
    127     f->exit_code = 1;
    128     Die();
    129   }
    130   ParseFlag(str, &f->report_umrs, "report_umrs");
    131   ParseFlag(str, &f->verbosity, "verbosity");
    132   ParseFlag(str, &f->wrap_signals, "wrap_signals");
    133   ParseFlag(str, &f->keep_going, "keep_going");
    134 }
    135 
    136 static void InitializeFlags(Flags *f, const char *options) {
    137   CommonFlags *cf = common_flags();
    138   cf->external_symbolizer_path = GetEnv("MSAN_SYMBOLIZER_PATH");
    139   cf->strip_path_prefix = "";
    140   cf->fast_unwind_on_fatal = false;
    141   cf->fast_unwind_on_malloc = true;
    142   cf->malloc_context_size = 20;
    143   cf->handle_ioctl = true;
    144   cf->log_path = 0;
    145 
    146   internal_memset(f, 0, sizeof(*f));
    147   f->poison_heap_with_zeroes = false;
    148   f->poison_stack_with_zeroes = false;
    149   f->poison_in_malloc = true;
    150   f->exit_code = 77;
    151   f->report_umrs = true;
    152   f->verbosity = 0;
    153   f->wrap_signals = true;
    154   f->keep_going = !!&__msan_keep_going;
    155 
    156   // Override from user-specified string.
    157   if (__msan_default_options)
    158     ParseFlagsFromString(f, __msan_default_options());
    159   ParseFlagsFromString(f, options);
    160 }
    161 
    162 static void GetCurrentStackBounds(uptr *stack_top, uptr *stack_bottom) {
    163   if (__msan_stack_bounds.stack_top == 0) {
    164     // Break recursion (GetStackTrace -> GetThreadStackTopAndBottom ->
    165     // realloc -> GetStackTrace).
    166     __msan_stack_bounds.stack_top = __msan_stack_bounds.stack_bottom = 1;
    167     GetThreadStackTopAndBottom(/* at_initialization */false,
    168                                &__msan_stack_bounds.stack_top,
    169                                &__msan_stack_bounds.stack_bottom);
    170   }
    171   *stack_top = __msan_stack_bounds.stack_top;
    172   *stack_bottom = __msan_stack_bounds.stack_bottom;
    173 }
    174 
    175 void GetStackTrace(StackTrace *stack, uptr max_s, uptr pc, uptr bp,
    176                    bool fast) {
    177   if (!fast) {
    178     // Block reports from our interceptors during _Unwind_Backtrace.
    179     SymbolizerScope sym_scope;
    180     return stack->SlowUnwindStack(pc, max_s);
    181   }
    182 
    183   uptr stack_top, stack_bottom;
    184   GetCurrentStackBounds(&stack_top, &stack_bottom);
    185   stack->size = 0;
    186   stack->trace[0] = pc;
    187   stack->max_size = max_s;
    188   stack->FastUnwindStack(pc, bp, stack_top, stack_bottom);
    189 }
    190 
    191 void PrintWarning(uptr pc, uptr bp) {
    192   PrintWarningWithOrigin(pc, bp, __msan_origin_tls);
    193 }
    194 
    195 bool OriginIsValid(u32 origin) {
    196   return origin != 0 && origin != (u32)-1;
    197 }
    198 
    199 void PrintWarningWithOrigin(uptr pc, uptr bp, u32 origin) {
    200   if (msan_expect_umr) {
    201     // Printf("Expected UMR\n");
    202     __msan_origin_tls = origin;
    203     msan_expected_umr_found = 1;
    204     return;
    205   }
    206 
    207   ++msan_report_count;
    208 
    209   StackTrace stack;
    210   GetStackTrace(&stack, kStackTraceMax, pc, bp,
    211                 common_flags()->fast_unwind_on_fatal);
    212 
    213   u32 report_origin =
    214     (__msan_get_track_origins() && OriginIsValid(origin)) ? origin : 0;
    215   ReportUMR(&stack, report_origin);
    216 
    217   if (__msan_get_track_origins() && !OriginIsValid(origin)) {
    218     Printf("  ORIGIN: invalid (%x). Might be a bug in MemorySanitizer, "
    219            "please report to MemorySanitizer developers.\n",
    220            origin);
    221   }
    222 }
    223 
    224 void UnpoisonParam(uptr n) {
    225   internal_memset(__msan_param_tls, 0, n * sizeof(*__msan_param_tls));
    226 }
    227 
    228 }  // namespace __msan
    229 
    230 // Interface.
    231 
    232 using namespace __msan;
    233 
    234 void __msan_warning() {
    235   GET_CALLER_PC_BP_SP;
    236   (void)sp;
    237   PrintWarning(pc, bp);
    238   if (!__msan::flags()->keep_going) {
    239     Printf("Exiting\n");
    240     Die();
    241   }
    242 }
    243 
    244 void __msan_warning_noreturn() {
    245   GET_CALLER_PC_BP_SP;
    246   (void)sp;
    247   PrintWarning(pc, bp);
    248   Printf("Exiting\n");
    249   Die();
    250 }
    251 
// One-time runtime initialization. It returns immediately if initialization
// has already completed (msan_inited != 0). The steps below are
// order-dependent; do not reorder them without checking each callee.
void __msan_init() {
  if (msan_inited) return;
  // Cleared again at the very end of this function.
  msan_init_is_running = 1;
  SanitizerToolName = "MemorySanitizer";

  InstallAtExitHandler();
  SetDieCallback(MsanDie);
  InitTlsSize();
  InitializeInterceptors();

  if (MSAN_REPLACE_OPERATORS_NEW_AND_DELETE)
    ReplaceOperatorsNewAndDelete();
  // Flags: defaults, then __msan_default_options(), then MSAN_OPTIONS.
  const char *msan_options = GetEnv("MSAN_OPTIONS");
  InitializeFlags(&msan_flags, msan_options);
  __sanitizer_set_report_path(common_flags()->log_path);
  if (StackSizeIsUnlimited()) {
    if (flags()->verbosity)
      Printf("Unlimited stack, doing reexec\n");
    // A reasonably large stack size. It is bigger than the usual 8Mb, because,
    // well, the program could have been run with unlimited stack for a reason.
    SetStackSizeLimitInBytes(32 * 1024 * 1024);
    ReExec();
  }

  if (flags()->verbosity)
    Printf("MSAN_OPTIONS: %s\n", msan_options ? msan_options : "<empty>");

  // Remembered for __msan_has_dynamic_component().
  msan_running_under_dr = IsRunningUnderDr();
  __msan_clear_on_return();
  if (__msan_get_track_origins() && flags()->verbosity > 0)
    Printf("msan_track_origins\n");
  // Failure to set up the shadow is fatal: print hints and the process map,
  // then die.
  if (!InitShadow(/* prot1 */ false, /* prot2 */ true, /* map_shadow */ true,
                  __msan_get_track_origins())) {
    // FIXME: prot1 = false is only required when running under DR.
    Printf("FATAL: MemorySanitizer can not mmap the shadow memory.\n");
    Printf("FATAL: Make sure to compile with -fPIE and to link with -pie.\n");
    Printf("FATAL: Disabling ASLR is known to cause this error.\n");
    Printf("FATAL: If running under GDB, try "
           "'set disable-randomization off'.\n");
    DumpProcessMap();
    Die();
  }

  // The external symbolizer is started only when a non-empty path is
  // configured.
  const char *external_symbolizer = common_flags()->external_symbolizer_path;
  if (external_symbolizer && external_symbolizer[0]) {
    CHECK(InitializeExternalSymbolizer(external_symbolizer));
  }

  // Pre-populate the calling thread's cached stack limits.
  GetThreadStackTopAndBottom(/* at_initialization */true,
                             &__msan_stack_bounds.stack_top,
                             &__msan_stack_bounds.stack_bottom);
  if (flags()->verbosity)
    Printf("MemorySanitizer init done\n");
  msan_init_is_running = 0;
  msan_inited = 1;
}
    308 
    309 void __msan_set_exit_code(int exit_code) {
    310   flags()->exit_code = exit_code;
    311 }
    312 
    313 void __msan_set_keep_going(int keep_going) {
    314   flags()->keep_going = keep_going;
    315 }
    316 
    317 void __msan_set_expect_umr(int expect_umr) {
    318   if (expect_umr) {
    319     msan_expected_umr_found = 0;
    320   } else if (!msan_expected_umr_found) {
    321     GET_CALLER_PC_BP_SP;
    322     (void)sp;
    323     StackTrace stack;
    324     GetStackTrace(&stack, kStackTraceMax, pc, bp,
    325                   common_flags()->fast_unwind_on_fatal);
    326     ReportExpectedUMRNotFound(&stack);
    327     Die();
    328   }
    329   msan_expect_umr = expect_umr;
    330 }
    331 
    332 void __msan_print_shadow(const void *x, uptr size) {
    333   unsigned char *s = (unsigned char*)MEM_TO_SHADOW(x);
    334   u32 *o = (u32*)MEM_TO_ORIGIN(x);
    335   for (uptr i = 0; i < size; i++) {
    336     Printf("%x%x ", s[i] >> 4, s[i] & 0xf);
    337   }
    338   Printf("\n");
    339   if (__msan_get_track_origins()) {
    340     for (uptr i = 0; i < size / 4; i++) {
    341       Printf(" o: %x ", o[i]);
    342     }
    343     Printf("\n");
    344   }
    345 }
    346 
    347 void __msan_print_param_shadow() {
    348   for (int i = 0; i < 16; i++) {
    349     Printf("#%d:%zx ", i, __msan_param_tls[i]);
    350   }
    351   Printf("\n");
    352 }
    353 
    354 sptr __msan_test_shadow(const void *x, uptr size) {
    355   unsigned char *s = (unsigned char*)MEM_TO_SHADOW((uptr)x);
    356   for (uptr i = 0; i < size; ++i)
    357     if (s[i])
    358       return i;
    359   return -1;
    360 }
    361 
    362 int __msan_set_poison_in_malloc(int do_poison) {
    363   int old = flags()->poison_in_malloc;
    364   flags()->poison_in_malloc = do_poison;
    365   return old;
    366 }
    367 
    368 int  __msan_has_dynamic_component() {
    369   return msan_running_under_dr;
    370 }
    371 
    372 NOINLINE
    373 void __msan_clear_on_return() {
    374   __msan_param_tls[0] = 0;
    375 }
    376 
    377 static void* get_tls_base() {
    378   u64 p;
    379   asm("mov %%fs:0, %0"
    380       : "=r"(p) ::);
    381   return (void*)p;
    382 }
    383 
    384 int __msan_get_retval_tls_offset() {
    385   // volatile here is needed to avoid UB, because the compiler thinks that we
    386   // are doing address arithmetics on unrelated pointers, and takes some
    387   // shortcuts
    388   volatile sptr retval_tls_p = (sptr)&__msan_retval_tls;
    389   volatile sptr tls_base_p = (sptr)get_tls_base();
    390   return retval_tls_p - tls_base_p;
    391 }
    392 
    393 int __msan_get_param_tls_offset() {
    394   // volatile here is needed to avoid UB, because the compiler thinks that we
    395   // are doing address arithmetics on unrelated pointers, and takes some
    396   // shortcuts
    397   volatile sptr param_tls_p = (sptr)&__msan_param_tls;
    398   volatile sptr tls_base_p = (sptr)get_tls_base();
    399   return param_tls_p - tls_base_p;
    400 }
    401 
    402 void __msan_partial_poison(const void* data, void* shadow, uptr size) {
    403   internal_memcpy((void*)MEM_TO_SHADOW((uptr)data), shadow, size);
    404 }
    405 
    406 void __msan_load_unpoisoned(void *src, uptr size, void *dst) {
    407   internal_memcpy(dst, src, size);
    408   __msan_unpoison(dst, size);
    409 }
    410 
    411 void __msan_set_origin(const void *a, uptr size, u32 origin) {
    412   // Origin mapping is 4 bytes per 4 bytes of application memory.
    413   // Here we extend the range such that its left and right bounds are both
    414   // 4 byte aligned.
    415   if (!__msan_get_track_origins()) return;
    416   uptr x = MEM_TO_ORIGIN((uptr)a);
    417   uptr beg = x & ~3UL;  // align down.
    418   uptr end = (x + size + 3) & ~3UL;  // align up.
    419   u64 origin64 = ((u64)origin << 32) | origin;
    420   // This is like memset, but the value is 32-bit. We unroll by 2 two write
    421   // 64-bits at once. May want to unroll further to get 128-bit stores.
    422   if (beg & 7ULL) {
    423     *(u32*)beg = origin;
    424     beg += 4;
    425   }
    426   for (uptr addr = beg; addr < (end & ~7UL); addr += 8)
    427     *(u64*)addr = origin64;
    428   if (end & 7ULL)
    429     *(u32*)(end - 4) = origin;
    430 }
    431 
    432 // 'descr' is created at compile time and contains '----' in the beginning.
    433 // When we see descr for the first time we replace '----' with a uniq id
    434 // and set the origin to (id | (31-th bit)).
    435 void __msan_set_alloca_origin(void *a, uptr size, const char *descr) {
    436   static const u32 dash = '-';
    437   static const u32 first_timer =
    438       dash + (dash << 8) + (dash << 16) + (dash << 24);
    439   u32 *id_ptr = (u32*)descr;
    440   bool print = false;  // internal_strstr(descr + 4, "AllocaTOTest") != 0;
    441   u32 id = *id_ptr;
    442   if (id == first_timer) {
    443     id = atomic_fetch_add(&NumStackOriginDescrs,
    444                           1, memory_order_relaxed);
    445     *id_ptr = id;
    446     CHECK_LT(id, kNumStackOriginDescrs);
    447     StackOriginDescr[id] = descr + 4;
    448     if (print)
    449       Printf("First time: id=%d %s \n", id, descr + 4);
    450   }
    451   id |= 1U << 31;
    452   if (print)
    453     Printf("__msan_set_alloca_origin: descr=%s id=%x\n", descr + 4, id);
    454   __msan_set_origin(a, size, id);
    455 }
    456 
    457 const char *__msan_get_origin_descr_if_stack(u32 id) {
    458   if ((id >> 31) == 0) return 0;
    459   id &= (1U << 31) - 1;
    460   CHECK_LT(id, kNumStackOriginDescrs);
    461   return StackOriginDescr[id];
    462 }
    463 
    464 
    465 u32 __msan_get_origin(const void *a) {
    466   if (!__msan_get_track_origins()) return 0;
    467   uptr x = (uptr)a;
    468   uptr aligned = x & ~3ULL;
    469   uptr origin_ptr = MEM_TO_ORIGIN(aligned);
    470   return *(u32*)origin_ptr;
    471 }
    472 
    473 u32 __msan_get_umr_origin() {
    474   return __msan_origin_tls;
    475 }
    476 
    477 u16 __sanitizer_unaligned_load16(const uu16 *p) {
    478   __msan_retval_tls[0] = *(uu16 *)MEM_TO_SHADOW((uptr)p);
    479   return *p;
    480 }
    481 u32 __sanitizer_unaligned_load32(const uu32 *p) {
    482   __msan_retval_tls[0] = *(uu32 *)MEM_TO_SHADOW((uptr)p);
    483   return *p;
    484 }
    485 u64 __sanitizer_unaligned_load64(const uu64 *p) {
    486   __msan_retval_tls[0] = *(uu64 *)MEM_TO_SHADOW((uptr)p);
    487   return *p;
    488 }
    489 void __sanitizer_unaligned_store16(uu16 *p, u16 x) {
    490   *(uu16 *)MEM_TO_SHADOW((uptr)p) = __msan_param_tls[1];
    491   *p = x;
    492 }
    493 void __sanitizer_unaligned_store32(uu32 *p, u32 x) {
    494   *(uu32 *)MEM_TO_SHADOW((uptr)p) = __msan_param_tls[1];
    495   *p = x;
    496 }
    497 void __sanitizer_unaligned_store64(uu64 *p, u64 x) {
    498   *(uu64 *)MEM_TO_SHADOW((uptr)p) = __msan_param_tls[1];
    499   *p = x;
    500 }
    501 
    502 #if !SANITIZER_SUPPORTS_WEAK_HOOKS
    503 extern "C" {
    504 SANITIZER_WEAK_ATTRIBUTE SANITIZER_INTERFACE_ATTRIBUTE
    505 const char* __msan_default_options() { return ""; }
    506 }  // extern "C"
    507 #endif
    508 
    509