//===-- msan.cc -----------------------------------------------------------===// // // The LLVM Compiler Infrastructure // // This file is distributed under the University of Illinois Open Source // License. See LICENSE.TXT for details. // //===----------------------------------------------------------------------===// // // This file is a part of MemorySanitizer. // // MemorySanitizer runtime. //===----------------------------------------------------------------------===// #include "msan.h" #include "sanitizer_common/sanitizer_atomic.h" #include "sanitizer_common/sanitizer_common.h" #include "sanitizer_common/sanitizer_flags.h" #include "sanitizer_common/sanitizer_libc.h" #include "sanitizer_common/sanitizer_procmaps.h" #include "sanitizer_common/sanitizer_stacktrace.h" #include "sanitizer_common/sanitizer_symbolizer.h" #include "interception/interception.h" // ACHTUNG! No system header includes in this file. using namespace __sanitizer; // Globals. static THREADLOCAL int msan_expect_umr = 0; static THREADLOCAL int msan_expected_umr_found = 0; static int msan_running_under_dr = 0; SANITIZER_INTERFACE_ATTRIBUTE THREADLOCAL u64 __msan_param_tls[kMsanParamTlsSizeInWords]; SANITIZER_INTERFACE_ATTRIBUTE THREADLOCAL u32 __msan_param_origin_tls[kMsanParamTlsSizeInWords]; SANITIZER_INTERFACE_ATTRIBUTE THREADLOCAL u64 __msan_retval_tls[kMsanRetvalTlsSizeInWords]; SANITIZER_INTERFACE_ATTRIBUTE THREADLOCAL u32 __msan_retval_origin_tls; SANITIZER_INTERFACE_ATTRIBUTE THREADLOCAL u64 __msan_va_arg_tls[kMsanParamTlsSizeInWords]; SANITIZER_INTERFACE_ATTRIBUTE THREADLOCAL u64 __msan_va_arg_overflow_size_tls; SANITIZER_INTERFACE_ATTRIBUTE THREADLOCAL u32 __msan_origin_tls; static THREADLOCAL struct { uptr stack_top, stack_bottom; } __msan_stack_bounds; static THREADLOCAL bool is_in_symbolizer; static THREADLOCAL bool is_in_loader; extern "C" const int __msan_track_origins; int __msan_get_track_origins() { return __msan_track_origins; } namespace __msan { static bool IsRunningUnderDr() { bool result = false; MemoryMappingLayout proc_maps; const sptr kBufSize = 4095; char *filename = (char*)MmapOrDie(kBufSize, __FUNCTION__); while (proc_maps.Next(/* start */0, /* end */0, /* file_offset */0, filename, kBufSize, /* protection */0)) { if (internal_strstr(filename, "libdynamorio") != 0) { result = true; break; } } UnmapOrDie(filename, kBufSize); return result; } void EnterSymbolizer() { is_in_symbolizer = true; } void ExitSymbolizer() { is_in_symbolizer = false; } bool IsInSymbolizer() { return is_in_symbolizer; } void EnterLoader() { is_in_loader = true; } void ExitLoader() { is_in_loader = false; } extern "C" { SANITIZER_INTERFACE_ATTRIBUTE bool __msan_is_in_loader() { return is_in_loader; } } static Flags msan_flags; Flags *flags() { return &msan_flags; } int msan_inited = 0; bool msan_init_is_running; int msan_report_count = 0; // Array of stack origins. // FIXME: make it resizable. static const uptr kNumStackOriginDescrs = 1024 * 1024; static const char *StackOriginDescr[kNumStackOriginDescrs]; static atomic_uint32_t NumStackOriginDescrs; static void ParseFlagsFromString(Flags *f, const char *str) { ParseFlag(str, &f->poison_heap_with_zeroes, "poison_heap_with_zeroes"); ParseFlag(str, &f->poison_stack_with_zeroes, "poison_stack_with_zeroes"); ParseFlag(str, &f->poison_in_malloc, "poison_in_malloc"); ParseFlag(str, &f->exit_code, "exit_code"); if (f->exit_code < 0 || f->exit_code > 127) { Printf("Exit code not in [0, 128) range: %d\n", f->exit_code); f->exit_code = 1; Die(); } ParseFlag(str, &f->num_callers, "num_callers"); ParseFlag(str, &f->report_umrs, "report_umrs"); ParseFlag(str, &f->verbosity, "verbosity"); ParseFlag(str, &f->strip_path_prefix, "strip_path_prefix"); ParseFlag(str, &f->fast_unwind_on_fatal, "fast_unwind_on_fatal"); ParseFlag(str, &f->fast_unwind_on_malloc, "fast_unwind_on_malloc"); } static void InitializeFlags(Flags *f, const char *options) { internal_memset(f, 0, sizeof(*f)); f->poison_heap_with_zeroes = false; f->poison_stack_with_zeroes = false; f->poison_in_malloc = true; f->exit_code = 77; f->num_callers = 20; f->report_umrs = true; f->verbosity = 0; f->strip_path_prefix = ""; f->fast_unwind_on_fatal = false; f->fast_unwind_on_malloc = true; // Override from user-specified string. if (__msan_default_options) ParseFlagsFromString(f, __msan_default_options()); ParseFlagsFromString(f, options); } static void GetCurrentStackBounds(uptr *stack_top, uptr *stack_bottom) { if (__msan_stack_bounds.stack_top == 0) { // Break recursion (GetStackTrace -> GetThreadStackTopAndBottom -> // realloc -> GetStackTrace). __msan_stack_bounds.stack_top = __msan_stack_bounds.stack_bottom = 1; GetThreadStackTopAndBottom(/* at_initialization */false, &__msan_stack_bounds.stack_top, &__msan_stack_bounds.stack_bottom); } *stack_top = __msan_stack_bounds.stack_top; *stack_bottom = __msan_stack_bounds.stack_bottom; } void GetStackTrace(StackTrace *stack, uptr max_s, uptr pc, uptr bp, bool fast) { if (!fast) { // Block reports from our interceptors during _Unwind_Backtrace. SymbolizerScope sym_scope; return stack->SlowUnwindStack(pc, max_s); } uptr stack_top, stack_bottom; GetCurrentStackBounds(&stack_top, &stack_bottom); stack->size = 0; stack->trace[0] = pc; stack->max_size = max_s; stack->FastUnwindStack(pc, bp, stack_top, stack_bottom); } void PrintWarning(uptr pc, uptr bp) { PrintWarningWithOrigin(pc, bp, __msan_origin_tls); } bool OriginIsValid(u32 origin) { return origin != 0 && origin != (u32)-1; } void PrintWarningWithOrigin(uptr pc, uptr bp, u32 origin) { if (msan_expect_umr) { // Printf("Expected UMR\n"); __msan_origin_tls = origin; msan_expected_umr_found = 1; return; } ++msan_report_count; StackTrace stack; GetStackTrace(&stack, kStackTraceMax, pc, bp, flags()->fast_unwind_on_fatal); u32 report_origin = (__msan_track_origins && OriginIsValid(origin)) ? origin : 0; ReportUMR(&stack, report_origin); if (__msan_track_origins && !OriginIsValid(origin)) { Printf(" ORIGIN: invalid (%x). Might be a bug in MemorySanitizer, " "please report to MemorySanitizer developers.\n", origin); } } } // namespace __msan // Interface. using namespace __msan; void __msan_warning() { GET_CALLER_PC_BP_SP; (void)sp; PrintWarning(pc, bp); } void __msan_warning_noreturn() { GET_CALLER_PC_BP_SP; (void)sp; PrintWarning(pc, bp); Printf("Exiting\n"); Die(); } void __msan_init() { if (msan_inited) return; msan_init_is_running = 1; SanitizerToolName = "MemorySanitizer"; InstallAtExitHandler(); SetDieCallback(MsanDie); InitTlsSize(); InitializeInterceptors(); ReplaceOperatorsNewAndDelete(); const char *msan_options = GetEnv("MSAN_OPTIONS"); InitializeFlags(&msan_flags, msan_options); if (StackSizeIsUnlimited()) { if (flags()->verbosity) Printf("Unlimited stack, doing reexec\n"); // A reasonably large stack size. It is bigger than the usual 8Mb, because, // well, the program could have been run with unlimited stack for a reason. SetStackSizeLimitInBytes(32 * 1024 * 1024); ReExec(); } if (flags()->verbosity) Printf("MSAN_OPTIONS: %s\n", msan_options ? msan_options : "<empty>"); msan_running_under_dr = IsRunningUnderDr(); __msan_clear_on_return(); if (__msan_track_origins && flags()->verbosity > 0) Printf("msan_track_origins\n"); if (!InitShadow(/* prot1 */false, /* prot2 */true, /* map_shadow */true, __msan_track_origins)) { // FIXME: prot1 = false is only required when running under DR. Printf("FATAL: MemorySanitizer can not mmap the shadow memory.\n"); Printf("FATAL: Make sure to compile with -fPIE and to link with -pie.\n"); Printf("FATAL: Disabling ASLR is known to cause this error.\n"); Printf("FATAL: If running under GDB, try " "'set disable-randomization off'.\n"); DumpProcessMap(); Die(); } const char *external_symbolizer = GetEnv("MSAN_SYMBOLIZER_PATH"); if (external_symbolizer && external_symbolizer[0]) { CHECK(InitializeExternalSymbolizer(external_symbolizer)); } GetThreadStackTopAndBottom(/* at_initialization */true, &__msan_stack_bounds.stack_top, &__msan_stack_bounds.stack_bottom); if (flags()->verbosity) Printf("MemorySanitizer init done\n"); msan_init_is_running = 0; msan_inited = 1; } void __msan_set_exit_code(int exit_code) { flags()->exit_code = exit_code; } void __msan_set_expect_umr(int expect_umr) { if (expect_umr) { msan_expected_umr_found = 0; } else if (!msan_expected_umr_found) { GET_CALLER_PC_BP_SP; (void)sp; StackTrace stack; GetStackTrace(&stack, kStackTraceMax, pc, bp, flags()->fast_unwind_on_fatal); ReportExpectedUMRNotFound(&stack); Die(); } msan_expect_umr = expect_umr; } void __msan_print_shadow(const void *x, uptr size) { unsigned char *s = (unsigned char*)MEM_TO_SHADOW(x); u32 *o = (u32*)MEM_TO_ORIGIN(x); for (uptr i = 0; i < size; i++) { Printf("%x%x ", s[i] >> 4, s[i] & 0xf); } Printf("\n"); if (__msan_track_origins) { for (uptr i = 0; i < size / 4; i++) { Printf(" o: %x ", o[i]); } Printf("\n"); } } void __msan_print_param_shadow() { for (int i = 0; i < 16; i++) { Printf("#%d:%zx ", i, __msan_param_tls[i]); } Printf("\n"); } sptr __msan_test_shadow(const void *x, uptr size) { unsigned char *s = (unsigned char*)MEM_TO_SHADOW((uptr)x); for (uptr i = 0; i < size; ++i) if (s[i]) return i; return -1; } int __msan_set_poison_in_malloc(int do_poison) { int old = flags()->poison_in_malloc; flags()->poison_in_malloc = do_poison; return old; } int __msan_has_dynamic_component() { return msan_running_under_dr; } NOINLINE void __msan_clear_on_return() { __msan_param_tls[0] = 0; } static void* get_tls_base() { u64 p; asm("mov %%fs:0, %0" : "=r"(p) ::); return (void*)p; } int __msan_get_retval_tls_offset() { // volatile here is needed to avoid UB, because the compiler thinks that we // are doing address arithmetics on unrelated pointers, and takes some // shortcuts volatile sptr retval_tls_p = (sptr)&__msan_retval_tls; volatile sptr tls_base_p = (sptr)get_tls_base(); return retval_tls_p - tls_base_p; } int __msan_get_param_tls_offset() { // volatile here is needed to avoid UB, because the compiler thinks that we // are doing address arithmetics on unrelated pointers, and takes some // shortcuts volatile sptr param_tls_p = (sptr)&__msan_param_tls; volatile sptr tls_base_p = (sptr)get_tls_base(); return param_tls_p - tls_base_p; } void __msan_partial_poison(void* data, void* shadow, uptr size) { internal_memcpy((void*)MEM_TO_SHADOW((uptr)data), shadow, size); } void __msan_load_unpoisoned(void *src, uptr size, void *dst) { internal_memcpy(dst, src, size); __msan_unpoison(dst, size); } void __msan_set_origin(void *a, uptr size, u32 origin) { // Origin mapping is 4 bytes per 4 bytes of application memory. // Here we extend the range such that its left and right bounds are both // 4 byte aligned. if (!__msan_track_origins) return; uptr x = MEM_TO_ORIGIN((uptr)a); uptr beg = x & ~3UL; // align down. uptr end = (x + size + 3) & ~3UL; // align up. u64 origin64 = ((u64)origin << 32) | origin; // This is like memset, but the value is 32-bit. We unroll by 2 two write // 64-bits at once. May want to unroll further to get 128-bit stores. if (beg & 7ULL) { *(u32*)beg = origin; beg += 4; } for (uptr addr = beg; addr < (end & ~7UL); addr += 8) *(u64*)addr = origin64; if (end & 7ULL) *(u32*)(end - 4) = origin; } // 'descr' is created at compile time and contains '----' in the beginning. // When we see descr for the first time we replace '----' with a uniq id // and set the origin to (id | (31-th bit)). void __msan_set_alloca_origin(void *a, uptr size, const char *descr) { static const u32 dash = '-'; static const u32 first_timer = dash + (dash << 8) + (dash << 16) + (dash << 24); u32 *id_ptr = (u32*)descr; bool print = false; // internal_strstr(descr + 4, "AllocaTOTest") != 0; u32 id = *id_ptr; if (id == first_timer) { id = atomic_fetch_add(&NumStackOriginDescrs, 1, memory_order_relaxed); *id_ptr = id; CHECK_LT(id, kNumStackOriginDescrs); StackOriginDescr[id] = descr + 4; if (print) Printf("First time: id=%d %s \n", id, descr + 4); } id |= 1U << 31; if (print) Printf("__msan_set_alloca_origin: descr=%s id=%x\n", descr + 4, id); __msan_set_origin(a, size, id); } const char *__msan_get_origin_descr_if_stack(u32 id) { if ((id >> 31) == 0) return 0; id &= (1U << 31) - 1; CHECK_LT(id, kNumStackOriginDescrs); return StackOriginDescr[id]; } u32 __msan_get_origin(void *a) { if (!__msan_track_origins) return 0; uptr x = (uptr)a; uptr aligned = x & ~3ULL; uptr origin_ptr = MEM_TO_ORIGIN(aligned); return *(u32*)origin_ptr; } u32 __msan_get_umr_origin() { return __msan_origin_tls; } #if !SANITIZER_SUPPORTS_WEAK_HOOKS extern "C" { SANITIZER_WEAK_ATTRIBUTE SANITIZER_INTERFACE_ATTRIBUTE const char* __msan_default_options() { return ""; } } // extern "C" #endif