• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 //===-- msan.cc -----------------------------------------------------------===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This file is a part of MemorySanitizer.
11 //
12 // MemorySanitizer runtime.
13 //===----------------------------------------------------------------------===//
14 
15 #include "msan.h"
16 #include "sanitizer_common/sanitizer_atomic.h"
17 #include "sanitizer_common/sanitizer_common.h"
18 #include "sanitizer_common/sanitizer_flags.h"
19 #include "sanitizer_common/sanitizer_libc.h"
20 #include "sanitizer_common/sanitizer_procmaps.h"
21 #include "sanitizer_common/sanitizer_stacktrace.h"
22 #include "sanitizer_common/sanitizer_symbolizer.h"
23 
24 #include "interception/interception.h"
25 
26 // ACHTUNG! No system header includes in this file.
27 
28 using namespace __sanitizer;
29 
// Globals.

// Per-thread switch written by __msan_set_expect_umr(). While it is non-zero,
// PrintWarningWithOrigin() records the report instead of printing it.
static THREADLOCAL int msan_expect_umr = 0;
// Per-thread marker: set to 1 when a report arrives while msan_expect_umr is
// on, reset to 0 when expectation mode is switched on.
static THREADLOCAL int msan_expected_umr_found = 0;

// Result of IsRunningUnderDr(), stored by __msan_init() and returned by
// __msan_has_dynamic_component().
static int msan_running_under_dr = 0;

// Exported thread-local storage slots.
// NOTE(review): presumably written by instrumented code to pass shadow and
// origin values across calls; this file only touches a few of them -- confirm
// against the instrumentation pass.

// Slot [0] is zeroed by __msan_clear_on_return(); the first 16 slots are
// printed by __msan_print_param_shadow().
SANITIZER_INTERFACE_ATTRIBUTE
THREADLOCAL u64 __msan_param_tls[kMsanParamTlsSizeInWords];

SANITIZER_INTERFACE_ATTRIBUTE
THREADLOCAL u32 __msan_param_origin_tls[kMsanParamTlsSizeInWords];

// Its offset from the TLS base is reported by __msan_get_retval_tls_offset().
SANITIZER_INTERFACE_ATTRIBUTE
THREADLOCAL u64 __msan_retval_tls[kMsanRetvalTlsSizeInWords];

SANITIZER_INTERFACE_ATTRIBUTE
THREADLOCAL u32 __msan_retval_origin_tls;

SANITIZER_INTERFACE_ATTRIBUTE
THREADLOCAL u64 __msan_va_arg_tls[kMsanParamTlsSizeInWords];

SANITIZER_INTERFACE_ATTRIBUTE
THREADLOCAL u64 __msan_va_arg_overflow_size_tls;

// Origin id consumed by PrintWarning() and returned by
// __msan_get_umr_origin().
SANITIZER_INTERFACE_ATTRIBUTE
THREADLOCAL u32 __msan_origin_tls;

// Per-thread cache of the stack limits; filled lazily by
// GetCurrentStackBounds() and eagerly for the initializing thread by
// __msan_init(). A stack_top of 0 means "not computed yet".
static THREADLOCAL struct {
  uptr stack_top, stack_bottom;
} __msan_stack_bounds;

// Per-thread markers toggled by EnterSymbolizer()/ExitSymbolizer() and
// EnterLoader()/ExitLoader() respectively.
static THREADLOCAL bool is_in_symbolizer;
static THREADLOCAL bool is_in_loader;

// Declared here, defined outside this file.
// NOTE(review): presumably emitted by the compiler instrumentation -- confirm.
extern "C" const int __msan_track_origins;
__msan_get_track_origins()65 int __msan_get_track_origins() {
66   return __msan_track_origins;
67 }
68 
69 namespace __msan {
70 
IsRunningUnderDr()71 static bool IsRunningUnderDr() {
72   bool result = false;
73   MemoryMappingLayout proc_maps;
74   const sptr kBufSize = 4095;
75   char *filename = (char*)MmapOrDie(kBufSize, __FUNCTION__);
76   while (proc_maps.Next(/* start */0, /* end */0, /* file_offset */0,
77                         filename, kBufSize, /* protection */0)) {
78     if (internal_strstr(filename, "libdynamorio") != 0) {
79       result = true;
80       break;
81     }
82   }
83   UnmapOrDie(filename, kBufSize);
84   return result;
85 }
86 
EnterSymbolizer()87 void EnterSymbolizer() { is_in_symbolizer = true; }
ExitSymbolizer()88 void ExitSymbolizer()  { is_in_symbolizer = false; }
IsInSymbolizer()89 bool IsInSymbolizer() { return is_in_symbolizer; }
90 
EnterLoader()91 void EnterLoader() { is_in_loader = true; }
ExitLoader()92 void ExitLoader()  { is_in_loader = false; }
93 
94 extern "C" {
95 SANITIZER_INTERFACE_ATTRIBUTE
__msan_is_in_loader()96 bool __msan_is_in_loader() { return is_in_loader; }
97 }
98 
99 static Flags msan_flags;
100 
flags()101 Flags *flags() {
102   return &msan_flags;
103 }
104 
// Set to 1 at the very end of __msan_init(); a non-zero value makes later
// __msan_init() calls return immediately.
int msan_inited = 0;
// True only while __msan_init() is executing.
bool msan_init_is_running;

// Incremented by PrintWarningWithOrigin() for every report it prints.
int msan_report_count = 0;

// Array of stack origins.
// FIXME: make it resizable.
// Slots are handed out by __msan_set_alloca_origin(), which bumps
// NumStackOriginDescrs and stores the description text in StackOriginDescr.
static const uptr kNumStackOriginDescrs = 1024 * 1024;
static const char *StackOriginDescr[kNumStackOriginDescrs];
static atomic_uint32_t NumStackOriginDescrs;
115 
ParseFlagsFromString(Flags * f,const char * str)116 static void ParseFlagsFromString(Flags *f, const char *str) {
117   ParseFlag(str, &f->poison_heap_with_zeroes, "poison_heap_with_zeroes");
118   ParseFlag(str, &f->poison_stack_with_zeroes, "poison_stack_with_zeroes");
119   ParseFlag(str, &f->poison_in_malloc, "poison_in_malloc");
120   ParseFlag(str, &f->exit_code, "exit_code");
121   if (f->exit_code < 0 || f->exit_code > 127) {
122     Printf("Exit code not in [0, 128) range: %d\n", f->exit_code);
123     f->exit_code = 1;
124     Die();
125   }
126   ParseFlag(str, &f->num_callers, "num_callers");
127   ParseFlag(str, &f->report_umrs, "report_umrs");
128   ParseFlag(str, &f->verbosity, "verbosity");
129   ParseFlag(str, &f->strip_path_prefix, "strip_path_prefix");
130   ParseFlag(str, &f->fast_unwind_on_fatal, "fast_unwind_on_fatal");
131   ParseFlag(str, &f->fast_unwind_on_malloc, "fast_unwind_on_malloc");
132 }
133 
InitializeFlags(Flags * f,const char * options)134 static void InitializeFlags(Flags *f, const char *options) {
135   internal_memset(f, 0, sizeof(*f));
136 
137   f->poison_heap_with_zeroes = false;
138   f->poison_stack_with_zeroes = false;
139   f->poison_in_malloc = true;
140   f->exit_code = 77;
141   f->num_callers = 20;
142   f->report_umrs = true;
143   f->verbosity = 0;
144   f->strip_path_prefix = "";
145   f->fast_unwind_on_fatal = false;
146   f->fast_unwind_on_malloc = true;
147 
148   // Override from user-specified string.
149   if (__msan_default_options)
150     ParseFlagsFromString(f, __msan_default_options());
151   ParseFlagsFromString(f, options);
152 }
153 
GetCurrentStackBounds(uptr * stack_top,uptr * stack_bottom)154 static void GetCurrentStackBounds(uptr *stack_top, uptr *stack_bottom) {
155   if (__msan_stack_bounds.stack_top == 0) {
156     // Break recursion (GetStackTrace -> GetThreadStackTopAndBottom ->
157     // realloc -> GetStackTrace).
158     __msan_stack_bounds.stack_top = __msan_stack_bounds.stack_bottom = 1;
159     GetThreadStackTopAndBottom(/* at_initialization */false,
160                                &__msan_stack_bounds.stack_top,
161                                &__msan_stack_bounds.stack_bottom);
162   }
163   *stack_top = __msan_stack_bounds.stack_top;
164   *stack_bottom = __msan_stack_bounds.stack_bottom;
165 }
166 
GetStackTrace(StackTrace * stack,uptr max_s,uptr pc,uptr bp,bool fast)167 void GetStackTrace(StackTrace *stack, uptr max_s, uptr pc, uptr bp,
168                    bool fast) {
169   if (!fast) {
170     // Block reports from our interceptors during _Unwind_Backtrace.
171     SymbolizerScope sym_scope;
172     return stack->SlowUnwindStack(pc, max_s);
173   }
174 
175   uptr stack_top, stack_bottom;
176   GetCurrentStackBounds(&stack_top, &stack_bottom);
177   stack->size = 0;
178   stack->trace[0] = pc;
179   stack->max_size = max_s;
180   stack->FastUnwindStack(pc, bp, stack_top, stack_bottom);
181 }
182 
PrintWarning(uptr pc,uptr bp)183 void PrintWarning(uptr pc, uptr bp) {
184   PrintWarningWithOrigin(pc, bp, __msan_origin_tls);
185 }
186 
OriginIsValid(u32 origin)187 bool OriginIsValid(u32 origin) {
188   return origin != 0 && origin != (u32)-1;
189 }
190 
PrintWarningWithOrigin(uptr pc,uptr bp,u32 origin)191 void PrintWarningWithOrigin(uptr pc, uptr bp, u32 origin) {
192   if (msan_expect_umr) {
193     // Printf("Expected UMR\n");
194     __msan_origin_tls = origin;
195     msan_expected_umr_found = 1;
196     return;
197   }
198 
199   ++msan_report_count;
200 
201   StackTrace stack;
202   GetStackTrace(&stack, kStackTraceMax, pc, bp, flags()->fast_unwind_on_fatal);
203 
204   u32 report_origin =
205     (__msan_track_origins && OriginIsValid(origin)) ? origin : 0;
206   ReportUMR(&stack, report_origin);
207 
208   if (__msan_track_origins && !OriginIsValid(origin)) {
209     Printf("  ORIGIN: invalid (%x). Might be a bug in MemorySanitizer, "
210            "please report to MemorySanitizer developers.\n",
211            origin);
212   }
213 }
214 
215 }  // namespace __msan
216 
217 // Interface.
218 
219 using namespace __msan;
220 
__msan_warning()221 void __msan_warning() {
222   GET_CALLER_PC_BP_SP;
223   (void)sp;
224   PrintWarning(pc, bp);
225 }
226 
__msan_warning_noreturn()227 void __msan_warning_noreturn() {
228   GET_CALLER_PC_BP_SP;
229   (void)sp;
230   PrintWarning(pc, bp);
231   Printf("Exiting\n");
232   Die();
233 }
234 
__msan_init()235 void __msan_init() {
236   if (msan_inited) return;
237   msan_init_is_running = 1;
238   SanitizerToolName = "MemorySanitizer";
239 
240   InstallAtExitHandler();
241   SetDieCallback(MsanDie);
242   InitTlsSize();
243   InitializeInterceptors();
244 
245   ReplaceOperatorsNewAndDelete();
246   const char *msan_options = GetEnv("MSAN_OPTIONS");
247   InitializeFlags(&msan_flags, msan_options);
248   if (StackSizeIsUnlimited()) {
249     if (flags()->verbosity)
250       Printf("Unlimited stack, doing reexec\n");
251     // A reasonably large stack size. It is bigger than the usual 8Mb, because,
252     // well, the program could have been run with unlimited stack for a reason.
253     SetStackSizeLimitInBytes(32 * 1024 * 1024);
254     ReExec();
255   }
256 
257   if (flags()->verbosity)
258     Printf("MSAN_OPTIONS: %s\n", msan_options ? msan_options : "<empty>");
259 
260   msan_running_under_dr = IsRunningUnderDr();
261   __msan_clear_on_return();
262   if (__msan_track_origins && flags()->verbosity > 0)
263     Printf("msan_track_origins\n");
264   if (!InitShadow(/* prot1 */false, /* prot2 */true, /* map_shadow */true,
265                   __msan_track_origins)) {
266     // FIXME: prot1 = false is only required when running under DR.
267     Printf("FATAL: MemorySanitizer can not mmap the shadow memory.\n");
268     Printf("FATAL: Make sure to compile with -fPIE and to link with -pie.\n");
269     Printf("FATAL: Disabling ASLR is known to cause this error.\n");
270     Printf("FATAL: If running under GDB, try "
271            "'set disable-randomization off'.\n");
272     DumpProcessMap();
273     Die();
274   }
275 
276   const char *external_symbolizer = GetEnv("MSAN_SYMBOLIZER_PATH");
277   if (external_symbolizer && external_symbolizer[0]) {
278     CHECK(InitializeExternalSymbolizer(external_symbolizer));
279   }
280 
281   GetThreadStackTopAndBottom(/* at_initialization */true,
282                              &__msan_stack_bounds.stack_top,
283                              &__msan_stack_bounds.stack_bottom);
284   if (flags()->verbosity)
285     Printf("MemorySanitizer init done\n");
286   msan_init_is_running = 0;
287   msan_inited = 1;
288 }
289 
__msan_set_exit_code(int exit_code)290 void __msan_set_exit_code(int exit_code) {
291   flags()->exit_code = exit_code;
292 }
293 
__msan_set_expect_umr(int expect_umr)294 void __msan_set_expect_umr(int expect_umr) {
295   if (expect_umr) {
296     msan_expected_umr_found = 0;
297   } else if (!msan_expected_umr_found) {
298     GET_CALLER_PC_BP_SP;
299     (void)sp;
300     StackTrace stack;
301     GetStackTrace(&stack, kStackTraceMax, pc, bp,
302                   flags()->fast_unwind_on_fatal);
303     ReportExpectedUMRNotFound(&stack);
304     Die();
305   }
306   msan_expect_umr = expect_umr;
307 }
308 
__msan_print_shadow(const void * x,uptr size)309 void __msan_print_shadow(const void *x, uptr size) {
310   unsigned char *s = (unsigned char*)MEM_TO_SHADOW(x);
311   u32 *o = (u32*)MEM_TO_ORIGIN(x);
312   for (uptr i = 0; i < size; i++) {
313     Printf("%x%x ", s[i] >> 4, s[i] & 0xf);
314   }
315   Printf("\n");
316   if (__msan_track_origins) {
317     for (uptr i = 0; i < size / 4; i++) {
318       Printf(" o: %x ", o[i]);
319     }
320     Printf("\n");
321   }
322 }
323 
__msan_print_param_shadow()324 void __msan_print_param_shadow() {
325   for (int i = 0; i < 16; i++) {
326     Printf("#%d:%zx ", i, __msan_param_tls[i]);
327   }
328   Printf("\n");
329 }
330 
__msan_test_shadow(const void * x,uptr size)331 sptr __msan_test_shadow(const void *x, uptr size) {
332   unsigned char *s = (unsigned char*)MEM_TO_SHADOW((uptr)x);
333   for (uptr i = 0; i < size; ++i)
334     if (s[i])
335       return i;
336   return -1;
337 }
338 
__msan_set_poison_in_malloc(int do_poison)339 int __msan_set_poison_in_malloc(int do_poison) {
340   int old = flags()->poison_in_malloc;
341   flags()->poison_in_malloc = do_poison;
342   return old;
343 }
344 
__msan_has_dynamic_component()345 int  __msan_has_dynamic_component() {
346   return msan_running_under_dr;
347 }
348 
349 NOINLINE
__msan_clear_on_return()350 void __msan_clear_on_return() {
351   __msan_param_tls[0] = 0;
352 }
353 
get_tls_base()354 static void* get_tls_base() {
355   u64 p;
356   asm("mov %%fs:0, %0"
357       : "=r"(p) ::);
358   return (void*)p;
359 }
360 
__msan_get_retval_tls_offset()361 int __msan_get_retval_tls_offset() {
362   // volatile here is needed to avoid UB, because the compiler thinks that we
363   // are doing address arithmetics on unrelated pointers, and takes some
364   // shortcuts
365   volatile sptr retval_tls_p = (sptr)&__msan_retval_tls;
366   volatile sptr tls_base_p = (sptr)get_tls_base();
367   return retval_tls_p - tls_base_p;
368 }
369 
__msan_get_param_tls_offset()370 int __msan_get_param_tls_offset() {
371   // volatile here is needed to avoid UB, because the compiler thinks that we
372   // are doing address arithmetics on unrelated pointers, and takes some
373   // shortcuts
374   volatile sptr param_tls_p = (sptr)&__msan_param_tls;
375   volatile sptr tls_base_p = (sptr)get_tls_base();
376   return param_tls_p - tls_base_p;
377 }
378 
__msan_partial_poison(void * data,void * shadow,uptr size)379 void __msan_partial_poison(void* data, void* shadow, uptr size) {
380   internal_memcpy((void*)MEM_TO_SHADOW((uptr)data), shadow, size);
381 }
382 
__msan_load_unpoisoned(void * src,uptr size,void * dst)383 void __msan_load_unpoisoned(void *src, uptr size, void *dst) {
384   internal_memcpy(dst, src, size);
385   __msan_unpoison(dst, size);
386 }
387 
__msan_set_origin(void * a,uptr size,u32 origin)388 void __msan_set_origin(void *a, uptr size, u32 origin) {
389   // Origin mapping is 4 bytes per 4 bytes of application memory.
390   // Here we extend the range such that its left and right bounds are both
391   // 4 byte aligned.
392   if (!__msan_track_origins) return;
393   uptr x = MEM_TO_ORIGIN((uptr)a);
394   uptr beg = x & ~3UL;  // align down.
395   uptr end = (x + size + 3) & ~3UL;  // align up.
396   u64 origin64 = ((u64)origin << 32) | origin;
397   // This is like memset, but the value is 32-bit. We unroll by 2 two write
398   // 64-bits at once. May want to unroll further to get 128-bit stores.
399   if (beg & 7ULL) {
400     *(u32*)beg = origin;
401     beg += 4;
402   }
403   for (uptr addr = beg; addr < (end & ~7UL); addr += 8)
404     *(u64*)addr = origin64;
405   if (end & 7ULL)
406     *(u32*)(end - 4) = origin;
407 }
408 
409 // 'descr' is created at compile time and contains '----' in the beginning.
410 // When we see descr for the first time we replace '----' with a uniq id
411 // and set the origin to (id | (31-th bit)).
__msan_set_alloca_origin(void * a,uptr size,const char * descr)412 void __msan_set_alloca_origin(void *a, uptr size, const char *descr) {
413   static const u32 dash = '-';
414   static const u32 first_timer =
415       dash + (dash << 8) + (dash << 16) + (dash << 24);
416   u32 *id_ptr = (u32*)descr;
417   bool print = false;  // internal_strstr(descr + 4, "AllocaTOTest") != 0;
418   u32 id = *id_ptr;
419   if (id == first_timer) {
420     id = atomic_fetch_add(&NumStackOriginDescrs,
421                           1, memory_order_relaxed);
422     *id_ptr = id;
423     CHECK_LT(id, kNumStackOriginDescrs);
424     StackOriginDescr[id] = descr + 4;
425     if (print)
426       Printf("First time: id=%d %s \n", id, descr + 4);
427   }
428   id |= 1U << 31;
429   if (print)
430     Printf("__msan_set_alloca_origin: descr=%s id=%x\n", descr + 4, id);
431   __msan_set_origin(a, size, id);
432 }
433 
__msan_get_origin_descr_if_stack(u32 id)434 const char *__msan_get_origin_descr_if_stack(u32 id) {
435   if ((id >> 31) == 0) return 0;
436   id &= (1U << 31) - 1;
437   CHECK_LT(id, kNumStackOriginDescrs);
438   return StackOriginDescr[id];
439 }
440 
441 
__msan_get_origin(void * a)442 u32 __msan_get_origin(void *a) {
443   if (!__msan_track_origins) return 0;
444   uptr x = (uptr)a;
445   uptr aligned = x & ~3ULL;
446   uptr origin_ptr = MEM_TO_ORIGIN(aligned);
447   return *(u32*)origin_ptr;
448 }
449 
__msan_get_umr_origin()450 u32 __msan_get_umr_origin() {
451   return __msan_origin_tls;
452 }
453 
// Fallback definition of __msan_default_options(), compiled only when
// SANITIZER_SUPPORTS_WEAK_HOOKS is false. It returns an empty option string,
// so InitializeFlags() picks up no extra defaults from it.
#if !SANITIZER_SUPPORTS_WEAK_HOOKS
extern "C" {
SANITIZER_WEAK_ATTRIBUTE SANITIZER_INTERFACE_ATTRIBUTE
const char* __msan_default_options() { return ""; }
}  // extern "C"
#endif
460 
461