asan_globals.cpp revision 360784
1//===-- asan_globals.cpp --------------------------------------------------===//
2//
3// Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4// See https://llvm.org/LICENSE.txt for license information.
5// SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6//
7//===----------------------------------------------------------------------===//
8//
9// This file is a part of AddressSanitizer, an address sanity checker.
10//
11// Handle globals.
12//===----------------------------------------------------------------------===//
13
14#include "asan_interceptors.h"
15#include "asan_internal.h"
16#include "asan_mapping.h"
17#include "asan_poisoning.h"
18#include "asan_report.h"
19#include "asan_stack.h"
20#include "asan_stats.h"
21#include "asan_suppressions.h"
22#include "asan_thread.h"
23#include "sanitizer_common/sanitizer_common.h"
24#include "sanitizer_common/sanitizer_mutex.h"
25#include "sanitizer_common/sanitizer_placement_new.h"
26#include "sanitizer_common/sanitizer_stackdepot.h"
27#include "sanitizer_common/sanitizer_symbolizer.h"
28
29namespace __asan {
30
31typedef __asan_global Global;
32
33struct ListOfGlobals {
34  const Global *g;
35  ListOfGlobals *next;
36};
37
38static BlockingMutex mu_for_globals(LINKER_INITIALIZED);
39static LowLevelAllocator allocator_for_globals;
40static ListOfGlobals *list_of_all_globals;
41
42static const int kDynamicInitGlobalsInitialCapacity = 512;
43struct DynInitGlobal {
44  Global g;
45  bool initialized;
46};
47typedef InternalMmapVector<DynInitGlobal> VectorOfGlobals;
48// Lazy-initialized and never deleted.
49static VectorOfGlobals *dynamic_init_globals;
50
51// We want to remember where a certain range of globals was registered.
52struct GlobalRegistrationSite {
53  u32 stack_id;
54  Global *g_first, *g_last;
55};
56typedef InternalMmapVector<GlobalRegistrationSite> GlobalRegistrationSiteVector;
57static GlobalRegistrationSiteVector *global_registration_site_vector;
58
59ALWAYS_INLINE void PoisonShadowForGlobal(const Global *g, u8 value) {
60  FastPoisonShadow(g->beg, g->size_with_redzone, value);
61}
62
63ALWAYS_INLINE void PoisonRedZones(const Global &g) {
64  uptr aligned_size = RoundUpTo(g.size, SHADOW_GRANULARITY);
65  FastPoisonShadow(g.beg + aligned_size, g.size_with_redzone - aligned_size,
66                   kAsanGlobalRedzoneMagic);
67  if (g.size != aligned_size) {
68    FastPoisonShadowPartialRightRedzone(
69        g.beg + RoundDownTo(g.size, SHADOW_GRANULARITY),
70        g.size % SHADOW_GRANULARITY,
71        SHADOW_GRANULARITY,
72        kAsanGlobalRedzoneMagic);
73  }
74}
75
76const uptr kMinimalDistanceFromAnotherGlobal = 64;
77
78static bool IsAddressNearGlobal(uptr addr, const __asan_global &g) {
79  if (addr <= g.beg - kMinimalDistanceFromAnotherGlobal) return false;
80  if (addr >= g.beg + g.size_with_redzone) return false;
81  return true;
82}
83
84static void ReportGlobal(const Global &g, const char *prefix) {
85  Report(
86      "%s Global[%p]: beg=%p size=%zu/%zu name=%s module=%s dyn_init=%zu "
87      "odr_indicator=%p\n",
88      prefix, &g, (void *)g.beg, g.size, g.size_with_redzone, g.name,
89      g.module_name, g.has_dynamic_init, (void *)g.odr_indicator);
90  if (g.location) {
91    Report("  location (%p): name=%s[%p], %d %d\n", g.location,
92           g.location->filename, g.location->filename, g.location->line_no,
93           g.location->column_no);
94  }
95}
96
97static u32 FindRegistrationSite(const Global *g) {
98  mu_for_globals.CheckLocked();
99  CHECK(global_registration_site_vector);
100  for (uptr i = 0, n = global_registration_site_vector->size(); i < n; i++) {
101    GlobalRegistrationSite &grs = (*global_registration_site_vector)[i];
102    if (g >= grs.g_first && g <= grs.g_last)
103      return grs.stack_id;
104  }
105  return 0;
106}
107
108int GetGlobalsForAddress(uptr addr, Global *globals, u32 *reg_sites,
109                         int max_globals) {
110  if (!flags()->report_globals) return 0;
111  BlockingMutexLock lock(&mu_for_globals);
112  int res = 0;
113  for (ListOfGlobals *l = list_of_all_globals; l; l = l->next) {
114    const Global &g = *l->g;
115    if (flags()->report_globals >= 2)
116      ReportGlobal(g, "Search");
117    if (IsAddressNearGlobal(addr, g)) {
118      internal_memcpy(&globals[res], &g, sizeof(g));
119      if (reg_sites)
120        reg_sites[res] = FindRegistrationSite(&g);
121      res++;
122      if (res == max_globals)
123        break;
124    }
125  }
126  return res;
127}
128
129enum GlobalSymbolState {
130  UNREGISTERED = 0,
131  REGISTERED = 1
132};
133
134// Check ODR violation for given global G via special ODR indicator. We use
135// this method in case compiler instruments global variables through their
136// local aliases.
137static void CheckODRViolationViaIndicator(const Global *g) {
138  // Instrumentation requests to skip ODR check.
139  if (g->odr_indicator == UINTPTR_MAX)
140    return;
141  u8 *odr_indicator = reinterpret_cast<u8 *>(g->odr_indicator);
142  if (*odr_indicator == UNREGISTERED) {
143    *odr_indicator = REGISTERED;
144    return;
145  }
146  // If *odr_indicator is DEFINED, some module have already registered
147  // externally visible symbol with the same name. This is an ODR violation.
148  for (ListOfGlobals *l = list_of_all_globals; l; l = l->next) {
149    if (g->odr_indicator == l->g->odr_indicator &&
150        (flags()->detect_odr_violation >= 2 || g->size != l->g->size) &&
151        !IsODRViolationSuppressed(g->name))
152      ReportODRViolation(g, FindRegistrationSite(g),
153                         l->g, FindRegistrationSite(l->g));
154  }
155}
156
157// Check ODR violation for given global G by checking if it's already poisoned.
158// We use this method in case compiler doesn't use private aliases for global
159// variables.
160static void CheckODRViolationViaPoisoning(const Global *g) {
161  if (__asan_region_is_poisoned(g->beg, g->size_with_redzone)) {
162    // This check may not be enough: if the first global is much larger
163    // the entire redzone of the second global may be within the first global.
164    for (ListOfGlobals *l = list_of_all_globals; l; l = l->next) {
165      if (g->beg == l->g->beg &&
166          (flags()->detect_odr_violation >= 2 || g->size != l->g->size) &&
167          !IsODRViolationSuppressed(g->name))
168        ReportODRViolation(g, FindRegistrationSite(g),
169                           l->g, FindRegistrationSite(l->g));
170    }
171  }
172}
173
174// Clang provides two different ways for global variables protection:
175// it can poison the global itself or its private alias. In former
176// case we may poison same symbol multiple times, that can help us to
177// cheaply detect ODR violation: if we try to poison an already poisoned
178// global, we have ODR violation error.
179// In latter case, we poison each symbol exactly once, so we use special
180// indicator symbol to perform similar check.
181// In either case, compiler provides a special odr_indicator field to Global
182// structure, that can contain two kinds of values:
183//   1) Non-zero value. In this case, odr_indicator is an address of
184//      corresponding indicator variable for given global.
185//   2) Zero. This means that we don't use private aliases for global variables
186//      and can freely check ODR violation with the first method.
187//
188// This routine chooses between two different methods of ODR violation
189// detection.
190static inline bool UseODRIndicator(const Global *g) {
191  return g->odr_indicator > 0;
192}
193
194// Register a global variable.
195// This function may be called more than once for every global
196// so we store the globals in a map.
197static void RegisterGlobal(const Global *g) {
198  CHECK(asan_inited);
199  if (flags()->report_globals >= 2)
200    ReportGlobal(*g, "Added");
201  CHECK(flags()->report_globals);
202  CHECK(AddrIsInMem(g->beg));
203  if (!AddrIsAlignedByGranularity(g->beg)) {
204    Report("The following global variable is not properly aligned.\n");
205    Report("This may happen if another global with the same name\n");
206    Report("resides in another non-instrumented module.\n");
207    Report("Or the global comes from a C file built w/o -fno-common.\n");
208    Report("In either case this is likely an ODR violation bug,\n");
209    Report("but AddressSanitizer can not provide more details.\n");
210    ReportODRViolation(g, FindRegistrationSite(g), g, FindRegistrationSite(g));
211    CHECK(AddrIsAlignedByGranularity(g->beg));
212  }
213  CHECK(AddrIsAlignedByGranularity(g->size_with_redzone));
214  if (flags()->detect_odr_violation) {
215    // Try detecting ODR (One Definition Rule) violation, i.e. the situation
216    // where two globals with the same name are defined in different modules.
217    if (UseODRIndicator(g))
218      CheckODRViolationViaIndicator(g);
219    else
220      CheckODRViolationViaPoisoning(g);
221  }
222  if (CanPoisonMemory())
223    PoisonRedZones(*g);
224  ListOfGlobals *l = new(allocator_for_globals) ListOfGlobals;
225  l->g = g;
226  l->next = list_of_all_globals;
227  list_of_all_globals = l;
228  if (g->has_dynamic_init) {
229    if (!dynamic_init_globals) {
230      dynamic_init_globals = new (allocator_for_globals) VectorOfGlobals;
231      dynamic_init_globals->reserve(kDynamicInitGlobalsInitialCapacity);
232    }
233    DynInitGlobal dyn_global = { *g, false };
234    dynamic_init_globals->push_back(dyn_global);
235  }
236}
237
238static void UnregisterGlobal(const Global *g) {
239  CHECK(asan_inited);
240  if (flags()->report_globals >= 2)
241    ReportGlobal(*g, "Removed");
242  CHECK(flags()->report_globals);
243  CHECK(AddrIsInMem(g->beg));
244  CHECK(AddrIsAlignedByGranularity(g->beg));
245  CHECK(AddrIsAlignedByGranularity(g->size_with_redzone));
246  if (CanPoisonMemory())
247    PoisonShadowForGlobal(g, 0);
248  // We unpoison the shadow memory for the global but we do not remove it from
249  // the list because that would require O(n^2) time with the current list
250  // implementation. It might not be worth doing anyway.
251
252  // Release ODR indicator.
253  if (UseODRIndicator(g) && g->odr_indicator != UINTPTR_MAX) {
254    u8 *odr_indicator = reinterpret_cast<u8 *>(g->odr_indicator);
255    *odr_indicator = UNREGISTERED;
256  }
257}
258
259void StopInitOrderChecking() {
260  BlockingMutexLock lock(&mu_for_globals);
261  if (!flags()->check_initialization_order || !dynamic_init_globals)
262    return;
263  flags()->check_initialization_order = false;
264  for (uptr i = 0, n = dynamic_init_globals->size(); i < n; ++i) {
265    DynInitGlobal &dyn_g = (*dynamic_init_globals)[i];
266    const Global *g = &dyn_g.g;
267    // Unpoison the whole global.
268    PoisonShadowForGlobal(g, 0);
269    // Poison redzones back.
270    PoisonRedZones(*g);
271  }
272}
273
274static bool IsASCII(unsigned char c) { return /*0x00 <= c &&*/ c <= 0x7F; }
275
276const char *MaybeDemangleGlobalName(const char *name) {
277  // We can spoil names of globals with C linkage, so use an heuristic
278  // approach to check if the name should be demangled.
279  bool should_demangle = false;
280  if (name[0] == '_' && name[1] == 'Z')
281    should_demangle = true;
282  else if (SANITIZER_WINDOWS && name[0] == '\01' && name[1] == '?')
283    should_demangle = true;
284
285  return should_demangle ? Symbolizer::GetOrInit()->Demangle(name) : name;
286}
287
288// Check if the global is a zero-terminated ASCII string. If so, print it.
289void PrintGlobalNameIfASCII(InternalScopedString *str, const __asan_global &g) {
290  for (uptr p = g.beg; p < g.beg + g.size - 1; p++) {
291    unsigned char c = *(unsigned char *)p;
292    if (c == '\0' || !IsASCII(c)) return;
293  }
294  if (*(char *)(g.beg + g.size - 1) != '\0') return;
295  str->append("  '%s' is ascii string '%s'\n", MaybeDemangleGlobalName(g.name),
296              (char *)g.beg);
297}
298
299static const char *GlobalFilename(const __asan_global &g) {
300  const char *res = g.module_name;
301  // Prefer the filename from source location, if is available.
302  if (g.location) res = g.location->filename;
303  CHECK(res);
304  return res;
305}
306
307void PrintGlobalLocation(InternalScopedString *str, const __asan_global &g) {
308  str->append("%s", GlobalFilename(g));
309  if (!g.location) return;
310  if (g.location->line_no) str->append(":%d", g.location->line_no);
311  if (g.location->column_no) str->append(":%d", g.location->column_no);
312}
313
314} // namespace __asan
315
316// ---------------------- Interface ---------------- {{{1
317using namespace __asan;
318
319// Apply __asan_register_globals to all globals found in the same loaded
320// executable or shared library as `flag'. The flag tracks whether globals have
321// already been registered or not for this image.
322void __asan_register_image_globals(uptr *flag) {
323  if (*flag)
324    return;
325  AsanApplyToGlobals(__asan_register_globals, flag);
326  *flag = 1;
327}
328
329// This mirrors __asan_register_image_globals.
330void __asan_unregister_image_globals(uptr *flag) {
331  if (!*flag)
332    return;
333  AsanApplyToGlobals(__asan_unregister_globals, flag);
334  *flag = 0;
335}
336
337void __asan_register_elf_globals(uptr *flag, void *start, void *stop) {
338  if (*flag) return;
339  if (!start) return;
340  CHECK_EQ(0, ((uptr)stop - (uptr)start) % sizeof(__asan_global));
341  __asan_global *globals_start = (__asan_global*)start;
342  __asan_global *globals_stop = (__asan_global*)stop;
343  __asan_register_globals(globals_start, globals_stop - globals_start);
344  *flag = 1;
345}
346
347void __asan_unregister_elf_globals(uptr *flag, void *start, void *stop) {
348  if (!*flag) return;
349  if (!start) return;
350  CHECK_EQ(0, ((uptr)stop - (uptr)start) % sizeof(__asan_global));
351  __asan_global *globals_start = (__asan_global*)start;
352  __asan_global *globals_stop = (__asan_global*)stop;
353  __asan_unregister_globals(globals_start, globals_stop - globals_start);
354  *flag = 0;
355}
356
357// Register an array of globals.
358void __asan_register_globals(__asan_global *globals, uptr n) {
359  if (!flags()->report_globals) return;
360  GET_STACK_TRACE_MALLOC;
361  u32 stack_id = StackDepotPut(stack);
362  BlockingMutexLock lock(&mu_for_globals);
363  if (!global_registration_site_vector) {
364    global_registration_site_vector =
365        new (allocator_for_globals) GlobalRegistrationSiteVector;
366    global_registration_site_vector->reserve(128);
367  }
368  GlobalRegistrationSite site = {stack_id, &globals[0], &globals[n - 1]};
369  global_registration_site_vector->push_back(site);
370  if (flags()->report_globals >= 2) {
371    PRINT_CURRENT_STACK();
372    Printf("=== ID %d; %p %p\n", stack_id, &globals[0], &globals[n - 1]);
373  }
374  for (uptr i = 0; i < n; i++) {
375    if (SANITIZER_WINDOWS && globals[i].beg == 0) {
376      // The MSVC incremental linker may pad globals out to 256 bytes. As long
377      // as __asan_global is less than 256 bytes large and its size is a power
378      // of two, we can skip over the padding.
379      static_assert(
380          sizeof(__asan_global) < 256 &&
381              (sizeof(__asan_global) & (sizeof(__asan_global) - 1)) == 0,
382          "sizeof(__asan_global) incompatible with incremental linker padding");
383      // If these are padding bytes, the rest of the global should be zero.
384      CHECK(globals[i].size == 0 && globals[i].size_with_redzone == 0 &&
385            globals[i].name == nullptr && globals[i].module_name == nullptr &&
386            globals[i].odr_indicator == 0);
387      continue;
388    }
389    RegisterGlobal(&globals[i]);
390  }
391
392  // Poison the metadata. It should not be accessible to user code.
393  PoisonShadow(reinterpret_cast<uptr>(globals), n * sizeof(__asan_global),
394               kAsanGlobalRedzoneMagic);
395}
396
397// Unregister an array of globals.
398// We must do this when a shared objects gets dlclosed.
399void __asan_unregister_globals(__asan_global *globals, uptr n) {
400  if (!flags()->report_globals) return;
401  BlockingMutexLock lock(&mu_for_globals);
402  for (uptr i = 0; i < n; i++) {
403    if (SANITIZER_WINDOWS && globals[i].beg == 0) {
404      // Skip globals that look like padding from the MSVC incremental linker.
405      // See comment in __asan_register_globals.
406      continue;
407    }
408    UnregisterGlobal(&globals[i]);
409  }
410
411  // Unpoison the metadata.
412  PoisonShadow(reinterpret_cast<uptr>(globals), n * sizeof(__asan_global), 0);
413}
414
415// This method runs immediately prior to dynamic initialization in each TU,
416// when all dynamically initialized globals are unpoisoned.  This method
417// poisons all global variables not defined in this TU, so that a dynamic
418// initializer can only touch global variables in the same TU.
419void __asan_before_dynamic_init(const char *module_name) {
420  if (!flags()->check_initialization_order ||
421      !CanPoisonMemory() ||
422      !dynamic_init_globals)
423    return;
424  bool strict_init_order = flags()->strict_init_order;
425  CHECK(module_name);
426  CHECK(asan_inited);
427  BlockingMutexLock lock(&mu_for_globals);
428  if (flags()->report_globals >= 3)
429    Printf("DynInitPoison module: %s\n", module_name);
430  for (uptr i = 0, n = dynamic_init_globals->size(); i < n; ++i) {
431    DynInitGlobal &dyn_g = (*dynamic_init_globals)[i];
432    const Global *g = &dyn_g.g;
433    if (dyn_g.initialized)
434      continue;
435    if (g->module_name != module_name)
436      PoisonShadowForGlobal(g, kAsanInitializationOrderMagic);
437    else if (!strict_init_order)
438      dyn_g.initialized = true;
439  }
440}
441
442// This method runs immediately after dynamic initialization in each TU, when
443// all dynamically initialized globals except for those defined in the current
444// TU are poisoned.  It simply unpoisons all dynamically initialized globals.
445void __asan_after_dynamic_init() {
446  if (!flags()->check_initialization_order ||
447      !CanPoisonMemory() ||
448      !dynamic_init_globals)
449    return;
450  CHECK(asan_inited);
451  BlockingMutexLock lock(&mu_for_globals);
452  // FIXME: Optionally report that we're unpoisoning globals from a module.
453  for (uptr i = 0, n = dynamic_init_globals->size(); i < n; ++i) {
454    DynInitGlobal &dyn_g = (*dynamic_init_globals)[i];
455    const Global *g = &dyn_g.g;
456    if (!dyn_g.initialized) {
457      // Unpoison the whole global.
458      PoisonShadowForGlobal(g, 0);
459      // Poison redzones back.
460      PoisonRedZones(*g);
461    }
462  }
463}
464