msan.cc revision a537ea99d3dcc4b2dc0033aee7ad5cb1b378efc7
1//===-- msan.cc -----------------------------------------------------------===//
2//
3//                     The LLVM Compiler Infrastructure
4//
5// This file is distributed under the University of Illinois Open Source
6// License. See LICENSE.TXT for details.
7//
8//===----------------------------------------------------------------------===//
9//
10// This file is a part of MemorySanitizer.
11//
12// MemorySanitizer runtime.
13//===----------------------------------------------------------------------===//
14
15#include "msan.h"
16#include "sanitizer_common/sanitizer_atomic.h"
17#include "sanitizer_common/sanitizer_common.h"
18#include "sanitizer_common/sanitizer_flags.h"
19#include "sanitizer_common/sanitizer_libc.h"
20#include "sanitizer_common/sanitizer_procmaps.h"
21#include "sanitizer_common/sanitizer_stacktrace.h"
22#include "sanitizer_common/sanitizer_symbolizer.h"
23
24#include "interception/interception.h"
25
26// ACHTUNG! No system header includes in this file.
27
28using namespace __sanitizer;
29
30// Globals.
31static THREADLOCAL int msan_expect_umr = 0;
32static THREADLOCAL int msan_expected_umr_found = 0;
33
34static int msan_running_under_dr = 0;
35
36SANITIZER_INTERFACE_ATTRIBUTE
37THREADLOCAL u64 __msan_param_tls[kMsanParamTlsSizeInWords];
38
39SANITIZER_INTERFACE_ATTRIBUTE
40THREADLOCAL u32 __msan_param_origin_tls[kMsanParamTlsSizeInWords];
41
42SANITIZER_INTERFACE_ATTRIBUTE
43THREADLOCAL u64 __msan_retval_tls[kMsanRetvalTlsSizeInWords];
44
45SANITIZER_INTERFACE_ATTRIBUTE
46THREADLOCAL u32 __msan_retval_origin_tls;
47
48SANITIZER_INTERFACE_ATTRIBUTE
49THREADLOCAL u64 __msan_va_arg_tls[kMsanParamTlsSizeInWords];
50
51SANITIZER_INTERFACE_ATTRIBUTE
52THREADLOCAL u64 __msan_va_arg_overflow_size_tls;
53
54SANITIZER_INTERFACE_ATTRIBUTE
55THREADLOCAL u32 __msan_origin_tls;
56
57static THREADLOCAL struct {
58  uptr stack_top, stack_bottom;
59} __msan_stack_bounds;
60
61static THREADLOCAL int is_in_symbolizer;
62static THREADLOCAL int is_in_loader;
63
64extern "C" SANITIZER_WEAK_ATTRIBUTE const int __msan_track_origins;
65
66int __msan_get_track_origins() {
67  return &__msan_track_origins ? __msan_track_origins : 0;
68}
69
70extern "C" SANITIZER_WEAK_ATTRIBUTE const int __msan_keep_going;
71
72namespace __msan {
73
74static bool IsRunningUnderDr() {
75  bool result = false;
76  MemoryMappingLayout proc_maps(/*cache_enabled*/true);
77  const sptr kBufSize = 4095;
78  char *filename = (char*)MmapOrDie(kBufSize, __FUNCTION__);
79  while (proc_maps.Next(/* start */0, /* end */0, /* file_offset */0,
80                        filename, kBufSize, /* protection */0)) {
81    if (internal_strstr(filename, "libdynamorio") != 0) {
82      result = true;
83      break;
84    }
85  }
86  UnmapOrDie(filename, kBufSize);
87  return result;
88}
89
90void EnterSymbolizer() { ++is_in_symbolizer; }
91void ExitSymbolizer()  { --is_in_symbolizer; }
92bool IsInSymbolizer() { return is_in_symbolizer; }
93
94void EnterLoader() { ++is_in_loader; }
95void ExitLoader()  { --is_in_loader; }
96
97extern "C" {
98SANITIZER_INTERFACE_ATTRIBUTE
99bool __msan_is_in_loader() { return is_in_loader; }
100}
101
102static Flags msan_flags;
103
104Flags *flags() {
105  return &msan_flags;
106}
107
108int msan_inited = 0;
109bool msan_init_is_running;
110
111int msan_report_count = 0;
112
113// Array of stack origins.
114// FIXME: make it resizable.
115static const uptr kNumStackOriginDescrs = 1024 * 1024;
116static const char *StackOriginDescr[kNumStackOriginDescrs];
117static uptr StackOriginPC[kNumStackOriginDescrs];
118static atomic_uint32_t NumStackOriginDescrs;
119
120static void ParseFlagsFromString(Flags *f, const char *str) {
121  ParseCommonFlagsFromString(str);
122  ParseFlag(str, &f->poison_heap_with_zeroes, "poison_heap_with_zeroes");
123  ParseFlag(str, &f->poison_stack_with_zeroes, "poison_stack_with_zeroes");
124  ParseFlag(str, &f->poison_in_malloc, "poison_in_malloc");
125  ParseFlag(str, &f->poison_in_free, "poison_in_free");
126  ParseFlag(str, &f->exit_code, "exit_code");
127  if (f->exit_code < 0 || f->exit_code > 127) {
128    Printf("Exit code not in [0, 128) range: %d\n", f->exit_code);
129    Die();
130  }
131  ParseFlag(str, &f->report_umrs, "report_umrs");
132  ParseFlag(str, &f->wrap_signals, "wrap_signals");
133
134  // keep_going is an old name for halt_on_error,
135  // and it has inverse meaning.
136  f->halt_on_error = !f->halt_on_error;
137  ParseFlag(str, &f->halt_on_error, "keep_going");
138  f->halt_on_error = !f->halt_on_error;
139  ParseFlag(str, &f->halt_on_error, "halt_on_error");
140}
141
142static void InitializeFlags(Flags *f, const char *options) {
143  CommonFlags *cf = common_flags();
144  cf->external_symbolizer_path = GetEnv("MSAN_SYMBOLIZER_PATH");
145  cf->symbolize = true;
146  cf->strip_path_prefix = "";
147  cf->fast_unwind_on_fatal = false;
148  cf->fast_unwind_on_malloc = true;
149  cf->malloc_context_size = 20;
150  cf->handle_ioctl = true;
151  cf->log_path = 0;
152
153  internal_memset(f, 0, sizeof(*f));
154  f->poison_heap_with_zeroes = false;
155  f->poison_stack_with_zeroes = false;
156  f->poison_in_malloc = true;
157  f->poison_in_free = true;
158  f->exit_code = 77;
159  f->report_umrs = true;
160  f->wrap_signals = true;
161  f->halt_on_error = !&__msan_keep_going;
162
163  // Override from user-specified string.
164  if (__msan_default_options)
165    ParseFlagsFromString(f, __msan_default_options());
166  ParseFlagsFromString(f, options);
167}
168
169static void GetCurrentStackBounds(uptr *stack_top, uptr *stack_bottom) {
170  if (__msan_stack_bounds.stack_top == 0) {
171    // Break recursion (GetStackTrace -> GetThreadStackTopAndBottom ->
172    // realloc -> GetStackTrace).
173    __msan_stack_bounds.stack_top = __msan_stack_bounds.stack_bottom = 1;
174    GetThreadStackTopAndBottom(/* at_initialization */false,
175                               &__msan_stack_bounds.stack_top,
176                               &__msan_stack_bounds.stack_bottom);
177  }
178  *stack_top = __msan_stack_bounds.stack_top;
179  *stack_bottom = __msan_stack_bounds.stack_bottom;
180}
181
182void GetStackTrace(StackTrace *stack, uptr max_s, uptr pc, uptr bp,
183                   bool request_fast_unwind) {
184  if (!StackTrace::WillUseFastUnwind(request_fast_unwind)) {
185    // Block reports from our interceptors during _Unwind_Backtrace.
186    SymbolizerScope sym_scope;
187    return stack->Unwind(max_s, pc, bp, 0, 0, request_fast_unwind);
188  }
189  uptr stack_top, stack_bottom;
190  GetCurrentStackBounds(&stack_top, &stack_bottom);
191  stack->Unwind(max_s, pc, bp, stack_top, stack_bottom, request_fast_unwind);
192}
193
194void PrintWarning(uptr pc, uptr bp) {
195  PrintWarningWithOrigin(pc, bp, __msan_origin_tls);
196}
197
198bool OriginIsValid(u32 origin) {
199  return origin != 0 && origin != (u32)-1;
200}
201
202void PrintWarningWithOrigin(uptr pc, uptr bp, u32 origin) {
203  if (msan_expect_umr) {
204    // Printf("Expected UMR\n");
205    __msan_origin_tls = origin;
206    msan_expected_umr_found = 1;
207    return;
208  }
209
210  ++msan_report_count;
211
212  StackTrace stack;
213  GetStackTrace(&stack, kStackTraceMax, pc, bp,
214                common_flags()->fast_unwind_on_fatal);
215
216  u32 report_origin =
217    (__msan_get_track_origins() && OriginIsValid(origin)) ? origin : 0;
218  ReportUMR(&stack, report_origin);
219
220  if (__msan_get_track_origins() && !OriginIsValid(origin)) {
221    Printf(
222        "  ORIGIN: invalid (%x). Might be a bug in MemorySanitizer origin "
223        "tracking.\n    This could still be a bug in your code, too!\n",
224        origin);
225  }
226}
227
228void UnpoisonParam(uptr n) {
229  internal_memset(__msan_param_tls, 0, n * sizeof(*__msan_param_tls));
230}
231
232// Backup MSan runtime TLS state.
233// Implementation must be async-signal-safe.
234// Instances of this class may live on the signal handler stack, and data size
235// may be an issue.
236void ScopedThreadLocalStateBackup::Backup() {
237  va_arg_overflow_size_tls = __msan_va_arg_overflow_size_tls;
238}
239
240void ScopedThreadLocalStateBackup::Restore() {
241  // A lame implementation that only keeps essential state and resets the rest.
242  __msan_va_arg_overflow_size_tls = va_arg_overflow_size_tls;
243
244  internal_memset(__msan_param_tls, 0, sizeof(__msan_param_tls));
245  internal_memset(__msan_retval_tls, 0, sizeof(__msan_retval_tls));
246  internal_memset(__msan_va_arg_tls, 0, sizeof(__msan_va_arg_tls));
247
248  if (__msan_get_track_origins()) {
249    internal_memset(&__msan_retval_origin_tls, 0, sizeof(__msan_retval_tls));
250    internal_memset(__msan_param_origin_tls, 0,
251                    sizeof(__msan_param_origin_tls));
252  }
253}
254
// Currently a no-op.
void UnpoisonThreadLocalState() {}
257
258const char *GetOriginDescrIfStack(u32 id, uptr *pc) {
259  if ((id >> 31) == 0) return 0;
260  id &= (1U << 31) - 1;
261  CHECK_LT(id, kNumStackOriginDescrs);
262  if (pc) *pc = StackOriginPC[id];
263  return StackOriginDescr[id];
264}
265
266}  // namespace __msan
267
268// Interface.
269
270using namespace __msan;
271
272void __msan_warning() {
273  GET_CALLER_PC_BP_SP;
274  (void)sp;
275  PrintWarning(pc, bp);
276  if (__msan::flags()->halt_on_error) {
277    Printf("Exiting\n");
278    Die();
279  }
280}
281
282void __msan_warning_noreturn() {
283  GET_CALLER_PC_BP_SP;
284  (void)sp;
285  PrintWarning(pc, bp);
286  Printf("Exiting\n");
287  Die();
288}
289
290void __msan_init() {
291  if (msan_inited) return;
292  msan_init_is_running = 1;
293  SanitizerToolName = "MemorySanitizer";
294
295  SetDieCallback(MsanDie);
296  InitTlsSize();
297
298  const char *msan_options = GetEnv("MSAN_OPTIONS");
299  InitializeFlags(&msan_flags, msan_options);
300  __sanitizer_set_report_path(common_flags()->log_path);
301
302  InitializeInterceptors();
303  InstallAtExitHandler(); // Needs __cxa_atexit interceptor.
304
305  if (MSAN_REPLACE_OPERATORS_NEW_AND_DELETE)
306    ReplaceOperatorsNewAndDelete();
307  if (StackSizeIsUnlimited()) {
308    if (common_flags()->verbosity)
309      Printf("Unlimited stack, doing reexec\n");
310    // A reasonably large stack size. It is bigger than the usual 8Mb, because,
311    // well, the program could have been run with unlimited stack for a reason.
312    SetStackSizeLimitInBytes(32 * 1024 * 1024);
313    ReExec();
314  }
315
316  if (common_flags()->verbosity)
317    Printf("MSAN_OPTIONS: %s\n", msan_options ? msan_options : "<empty>");
318
319  msan_running_under_dr = IsRunningUnderDr();
320  __msan_clear_on_return();
321  if (__msan_get_track_origins() && common_flags()->verbosity > 0)
322    Printf("msan_track_origins\n");
323  if (!InitShadow(/* prot1 */ false, /* prot2 */ true, /* map_shadow */ true,
324                  __msan_get_track_origins())) {
325    // FIXME: prot1 = false is only required when running under DR.
326    Printf("FATAL: MemorySanitizer can not mmap the shadow memory.\n");
327    Printf("FATAL: Make sure to compile with -fPIE and to link with -pie.\n");
328    Printf("FATAL: Disabling ASLR is known to cause this error.\n");
329    Printf("FATAL: If running under GDB, try "
330           "'set disable-randomization off'.\n");
331    DumpProcessMap();
332    Die();
333  }
334
335  const char *external_symbolizer = common_flags()->external_symbolizer_path;
336  bool external_symbolizer_started =
337      Symbolizer::Init(external_symbolizer)->IsExternalAvailable();
338  if (external_symbolizer && external_symbolizer[0]) {
339    CHECK(external_symbolizer_started);
340  }
341  Symbolizer::Get()->AddHooks(EnterSymbolizer, ExitSymbolizer);
342
343  GetThreadStackTopAndBottom(/* at_initialization */true,
344                             &__msan_stack_bounds.stack_top,
345                             &__msan_stack_bounds.stack_bottom);
346  if (common_flags()->verbosity)
347    Printf("MemorySanitizer init done\n");
348  msan_init_is_running = 0;
349  msan_inited = 1;
350}
351
352void __msan_set_exit_code(int exit_code) {
353  flags()->exit_code = exit_code;
354}
355
356void __msan_set_keep_going(int keep_going) {
357  flags()->halt_on_error = !keep_going;
358}
359
360void __msan_set_expect_umr(int expect_umr) {
361  if (expect_umr) {
362    msan_expected_umr_found = 0;
363  } else if (!msan_expected_umr_found) {
364    GET_CALLER_PC_BP_SP;
365    (void)sp;
366    StackTrace stack;
367    GetStackTrace(&stack, kStackTraceMax, pc, bp,
368                  common_flags()->fast_unwind_on_fatal);
369    ReportExpectedUMRNotFound(&stack);
370    Die();
371  }
372  msan_expect_umr = expect_umr;
373}
374
375void __msan_print_shadow(const void *x, uptr size) {
376  if (!MEM_IS_APP(x)) {
377    Printf("Not a valid application address: %p\n", x);
378    return;
379  }
380  unsigned char *s = (unsigned char*)MEM_TO_SHADOW(x);
381  u32 *o = (u32*)MEM_TO_ORIGIN(x);
382  for (uptr i = 0; i < size; i++) {
383    Printf("%x%x ", s[i] >> 4, s[i] & 0xf);
384  }
385  Printf("\n");
386  if (__msan_get_track_origins()) {
387    for (uptr i = 0; i < size / 4; i++) {
388      Printf(" o: %x ", o[i]);
389    }
390    Printf("\n");
391  }
392}
393
394void __msan_print_param_shadow() {
395  for (int i = 0; i < 16; i++) {
396    Printf("#%d:%zx ", i, __msan_param_tls[i]);
397  }
398  Printf("\n");
399}
400
401sptr __msan_test_shadow(const void *x, uptr size) {
402  unsigned char *s = (unsigned char*)MEM_TO_SHADOW((uptr)x);
403  for (uptr i = 0; i < size; ++i)
404    if (s[i])
405      return i;
406  return -1;
407}
408
409int __msan_set_poison_in_malloc(int do_poison) {
410  int old = flags()->poison_in_malloc;
411  flags()->poison_in_malloc = do_poison;
412  return old;
413}
414
415int  __msan_has_dynamic_component() {
416  return msan_running_under_dr;
417}
418
419NOINLINE
420void __msan_clear_on_return() {
421  __msan_param_tls[0] = 0;
422}
423
424static void* get_tls_base() {
425  u64 p;
426  asm("mov %%fs:0, %0"
427      : "=r"(p) ::);
428  return (void*)p;
429}
430
431int __msan_get_retval_tls_offset() {
432  // volatile here is needed to avoid UB, because the compiler thinks that we
433  // are doing address arithmetics on unrelated pointers, and takes some
434  // shortcuts
435  volatile sptr retval_tls_p = (sptr)&__msan_retval_tls;
436  volatile sptr tls_base_p = (sptr)get_tls_base();
437  return retval_tls_p - tls_base_p;
438}
439
440int __msan_get_param_tls_offset() {
441  // volatile here is needed to avoid UB, because the compiler thinks that we
442  // are doing address arithmetics on unrelated pointers, and takes some
443  // shortcuts
444  volatile sptr param_tls_p = (sptr)&__msan_param_tls;
445  volatile sptr tls_base_p = (sptr)get_tls_base();
446  return param_tls_p - tls_base_p;
447}
448
449void __msan_partial_poison(const void* data, void* shadow, uptr size) {
450  internal_memcpy((void*)MEM_TO_SHADOW((uptr)data), shadow, size);
451}
452
453void __msan_load_unpoisoned(void *src, uptr size, void *dst) {
454  internal_memcpy(dst, src, size);
455  __msan_unpoison(dst, size);
456}
457
458void __msan_set_origin(const void *a, uptr size, u32 origin) {
459  // Origin mapping is 4 bytes per 4 bytes of application memory.
460  // Here we extend the range such that its left and right bounds are both
461  // 4 byte aligned.
462  if (!__msan_get_track_origins()) return;
463  uptr x = MEM_TO_ORIGIN((uptr)a);
464  uptr beg = x & ~3UL;  // align down.
465  uptr end = (x + size + 3) & ~3UL;  // align up.
466  u64 origin64 = ((u64)origin << 32) | origin;
467  // This is like memset, but the value is 32-bit. We unroll by 2 two write
468  // 64-bits at once. May want to unroll further to get 128-bit stores.
469  if (beg & 7ULL) {
470    *(u32*)beg = origin;
471    beg += 4;
472  }
473  for (uptr addr = beg; addr < (end & ~7UL); addr += 8)
474    *(u64*)addr = origin64;
475  if (end & 7ULL)
476    *(u32*)(end - 4) = origin;
477}
478
479// 'descr' is created at compile time and contains '----' in the beginning.
480// When we see descr for the first time we replace '----' with a uniq id
481// and set the origin to (id | (31-th bit)).
482void __msan_set_alloca_origin(void *a, uptr size, const char *descr) {
483  __msan_set_alloca_origin4(a, size, descr, 0);
484}
485
486void __msan_set_alloca_origin4(void *a, uptr size, const char *descr, uptr pc) {
487  static const u32 dash = '-';
488  static const u32 first_timer =
489      dash + (dash << 8) + (dash << 16) + (dash << 24);
490  u32 *id_ptr = (u32*)descr;
491  bool print = false;  // internal_strstr(descr + 4, "AllocaTOTest") != 0;
492  u32 id = *id_ptr;
493  if (id == first_timer) {
494    id = atomic_fetch_add(&NumStackOriginDescrs,
495                          1, memory_order_relaxed);
496    *id_ptr = id;
497    CHECK_LT(id, kNumStackOriginDescrs);
498    StackOriginDescr[id] = descr + 4;
499    StackOriginPC[id] = pc;
500    if (print)
501      Printf("First time: id=%d %s %p \n", id, descr + 4, pc);
502  }
503  id |= 1U << 31;
504  if (print)
505    Printf("__msan_set_alloca_origin: descr=%s id=%x\n", descr + 4, id);
506  __msan_set_origin(a, size, id);
507}
508
509const char *__msan_get_origin_descr_if_stack(u32 id) {
510  return GetOriginDescrIfStack(id, 0);
511}
512
513u32 __msan_get_origin(const void *a) {
514  if (!__msan_get_track_origins()) return 0;
515  uptr x = (uptr)a;
516  uptr aligned = x & ~3ULL;
517  uptr origin_ptr = MEM_TO_ORIGIN(aligned);
518  return *(u32*)origin_ptr;
519}
520
521u32 __msan_get_umr_origin() {
522  return __msan_origin_tls;
523}
524
525u16 __sanitizer_unaligned_load16(const uu16 *p) {
526  __msan_retval_tls[0] = *(uu16 *)MEM_TO_SHADOW((uptr)p);
527  if (__msan_get_track_origins())
528    __msan_retval_origin_tls = *(uu32 *)MEM_TO_ORIGIN((uptr)p);
529  return *p;
530}
531u32 __sanitizer_unaligned_load32(const uu32 *p) {
532  __msan_retval_tls[0] = *(uu32 *)MEM_TO_SHADOW((uptr)p);
533  if (__msan_get_track_origins())
534    __msan_retval_origin_tls = *(uu32 *)MEM_TO_ORIGIN((uptr)p);
535  return *p;
536}
537u64 __sanitizer_unaligned_load64(const uu64 *p) {
538  __msan_retval_tls[0] = *(uu64 *)MEM_TO_SHADOW((uptr)p);
539  if (__msan_get_track_origins())
540    __msan_retval_origin_tls = *(uu32 *)MEM_TO_ORIGIN((uptr)p);
541  return *p;
542}
543void __sanitizer_unaligned_store16(uu16 *p, u16 x) {
544  *(uu16 *)MEM_TO_SHADOW((uptr)p) = __msan_param_tls[1];
545  if (__msan_get_track_origins())
546    *(uu32 *)MEM_TO_ORIGIN((uptr)p) = __msan_param_origin_tls[1];
547  *p = x;
548}
549void __sanitizer_unaligned_store32(uu32 *p, u32 x) {
550  *(uu32 *)MEM_TO_SHADOW((uptr)p) = __msan_param_tls[1];
551  if (__msan_get_track_origins())
552    *(uu32 *)MEM_TO_ORIGIN((uptr)p) = __msan_param_origin_tls[1];
553  *p = x;
554}
555void __sanitizer_unaligned_store64(uu64 *p, u64 x) {
556  *(uu64 *)MEM_TO_SHADOW((uptr)p) = __msan_param_tls[1];
557  if (__msan_get_track_origins())
558    *(uu32 *)MEM_TO_ORIGIN((uptr)p) = __msan_param_origin_tls[1];
559  *p = x;
560}
561
562#if !SANITIZER_SUPPORTS_WEAK_HOOKS
563extern "C" {
564SANITIZER_INTERFACE_ATTRIBUTE SANITIZER_WEAK_ATTRIBUTE
565const char* __msan_default_options() { return ""; }
566}  // extern "C"
567#endif
568
569