1 //===-- asan_globals.cpp --------------------------------------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This file is a part of AddressSanitizer, an address sanity checker.
10 //
11 // Handle globals.
12 //===----------------------------------------------------------------------===//
13
14 #include "asan_interceptors.h"
15 #include "asan_internal.h"
16 #include "asan_mapping.h"
17 #include "asan_poisoning.h"
18 #include "asan_report.h"
19 #include "asan_stack.h"
20 #include "asan_stats.h"
21 #include "asan_suppressions.h"
22 #include "asan_thread.h"
23 #include "sanitizer_common/sanitizer_common.h"
24 #include "sanitizer_common/sanitizer_mutex.h"
25 #include "sanitizer_common/sanitizer_placement_new.h"
26 #include "sanitizer_common/sanitizer_stackdepot.h"
27 #include "sanitizer_common/sanitizer_symbolizer.h"
28
29 namespace __asan {
30
31 typedef __asan_global Global;
32
33 struct ListOfGlobals {
34 const Global *g;
35 ListOfGlobals *next;
36 };
37
38 static Mutex mu_for_globals;
39 static ListOfGlobals *list_of_all_globals;
40
41 static const int kDynamicInitGlobalsInitialCapacity = 512;
42 struct DynInitGlobal {
43 Global g;
44 bool initialized;
45 };
46 typedef InternalMmapVector<DynInitGlobal> VectorOfGlobals;
47 // Lazy-initialized and never deleted.
48 static VectorOfGlobals *dynamic_init_globals;
49
50 // We want to remember where a certain range of globals was registered.
51 struct GlobalRegistrationSite {
52 u32 stack_id;
53 Global *g_first, *g_last;
54 };
55 typedef InternalMmapVector<GlobalRegistrationSite> GlobalRegistrationSiteVector;
56 static GlobalRegistrationSiteVector *global_registration_site_vector;
57
PoisonShadowForGlobal(const Global * g,u8 value)58 ALWAYS_INLINE void PoisonShadowForGlobal(const Global *g, u8 value) {
59 FastPoisonShadow(g->beg, g->size_with_redzone, value);
60 }
61
PoisonRedZones(const Global & g)62 ALWAYS_INLINE void PoisonRedZones(const Global &g) {
63 uptr aligned_size = RoundUpTo(g.size, ASAN_SHADOW_GRANULARITY);
64 FastPoisonShadow(g.beg + aligned_size, g.size_with_redzone - aligned_size,
65 kAsanGlobalRedzoneMagic);
66 if (g.size != aligned_size) {
67 FastPoisonShadowPartialRightRedzone(
68 g.beg + RoundDownTo(g.size, ASAN_SHADOW_GRANULARITY),
69 g.size % ASAN_SHADOW_GRANULARITY, ASAN_SHADOW_GRANULARITY,
70 kAsanGlobalRedzoneMagic);
71 }
72 }
73
74 const uptr kMinimalDistanceFromAnotherGlobal = 64;
75
IsAddressNearGlobal(uptr addr,const __asan_global & g)76 static bool IsAddressNearGlobal(uptr addr, const __asan_global &g) {
77 if (addr <= g.beg - kMinimalDistanceFromAnotherGlobal) return false;
78 if (addr >= g.beg + g.size_with_redzone) return false;
79 return true;
80 }
81
ReportGlobal(const Global & g,const char * prefix)82 static void ReportGlobal(const Global &g, const char *prefix) {
83 DataInfo info;
84 bool symbolized = Symbolizer::GetOrInit()->SymbolizeData(g.beg, &info);
85 Report(
86 "%s Global[%p]: beg=%p size=%zu/%zu name=%s source=%s module=%s "
87 "dyn_init=%zu "
88 "odr_indicator=%p\n",
89 prefix, (void *)&g, (void *)g.beg, g.size, g.size_with_redzone, g.name,
90 g.module_name, (symbolized ? info.module : "?"), g.has_dynamic_init,
91 (void *)g.odr_indicator);
92
93 if (symbolized && info.line != 0) {
94 Report(" location: name=%s, %d\n", info.file, static_cast<int>(info.line));
95 } else if (g.gcc_location != 0) {
96 // Fallback to Global::gcc_location
97 Report(" location: name=%s, %d\n", g.gcc_location->filename, g.gcc_location->line_no);
98 }
99 }
100
FindRegistrationSite(const Global * g)101 static u32 FindRegistrationSite(const Global *g) {
102 mu_for_globals.CheckLocked();
103 CHECK(global_registration_site_vector);
104 for (uptr i = 0, n = global_registration_site_vector->size(); i < n; i++) {
105 GlobalRegistrationSite &grs = (*global_registration_site_vector)[i];
106 if (g >= grs.g_first && g <= grs.g_last)
107 return grs.stack_id;
108 }
109 return 0;
110 }
111
GetGlobalsForAddress(uptr addr,Global * globals,u32 * reg_sites,int max_globals)112 int GetGlobalsForAddress(uptr addr, Global *globals, u32 *reg_sites,
113 int max_globals) {
114 if (!flags()->report_globals) return 0;
115 Lock lock(&mu_for_globals);
116 int res = 0;
117 for (ListOfGlobals *l = list_of_all_globals; l; l = l->next) {
118 const Global &g = *l->g;
119 if (flags()->report_globals >= 2)
120 ReportGlobal(g, "Search");
121 if (IsAddressNearGlobal(addr, g)) {
122 internal_memcpy(&globals[res], &g, sizeof(g));
123 if (reg_sites)
124 reg_sites[res] = FindRegistrationSite(&g);
125 res++;
126 if (res == max_globals)
127 break;
128 }
129 }
130 return res;
131 }
132
// Values stored in the byte that a global's ODR indicator points at.
enum GlobalSymbolState { UNREGISTERED = 0, REGISTERED = 1 };
137
138 // Check ODR violation for given global G via special ODR indicator. We use
139 // this method in case compiler instruments global variables through their
140 // local aliases.
CheckODRViolationViaIndicator(const Global * g)141 static void CheckODRViolationViaIndicator(const Global *g) {
142 // Instrumentation requests to skip ODR check.
143 if (g->odr_indicator == UINTPTR_MAX)
144 return;
145 u8 *odr_indicator = reinterpret_cast<u8 *>(g->odr_indicator);
146 if (*odr_indicator == UNREGISTERED) {
147 *odr_indicator = REGISTERED;
148 return;
149 }
150 // If *odr_indicator is DEFINED, some module have already registered
151 // externally visible symbol with the same name. This is an ODR violation.
152 for (ListOfGlobals *l = list_of_all_globals; l; l = l->next) {
153 if (g->odr_indicator == l->g->odr_indicator &&
154 (flags()->detect_odr_violation >= 2 || g->size != l->g->size) &&
155 !IsODRViolationSuppressed(g->name))
156 ReportODRViolation(g, FindRegistrationSite(g),
157 l->g, FindRegistrationSite(l->g));
158 }
159 }
160
161 // Check ODR violation for given global G by checking if it's already poisoned.
162 // We use this method in case compiler doesn't use private aliases for global
163 // variables.
CheckODRViolationViaPoisoning(const Global * g)164 static void CheckODRViolationViaPoisoning(const Global *g) {
165 if (__asan_region_is_poisoned(g->beg, g->size_with_redzone)) {
166 // This check may not be enough: if the first global is much larger
167 // the entire redzone of the second global may be within the first global.
168 for (ListOfGlobals *l = list_of_all_globals; l; l = l->next) {
169 if (g->beg == l->g->beg &&
170 (flags()->detect_odr_violation >= 2 || g->size != l->g->size) &&
171 !IsODRViolationSuppressed(g->name))
172 ReportODRViolation(g, FindRegistrationSite(g),
173 l->g, FindRegistrationSite(l->g));
174 }
175 }
176 }
177
178 // Clang provides two different ways for global variables protection:
179 // it can poison the global itself or its private alias. In former
180 // case we may poison same symbol multiple times, that can help us to
181 // cheaply detect ODR violation: if we try to poison an already poisoned
182 // global, we have ODR violation error.
183 // In latter case, we poison each symbol exactly once, so we use special
184 // indicator symbol to perform similar check.
185 // In either case, compiler provides a special odr_indicator field to Global
186 // structure, that can contain two kinds of values:
187 // 1) Non-zero value. In this case, odr_indicator is an address of
188 // corresponding indicator variable for given global.
189 // 2) Zero. This means that we don't use private aliases for global variables
190 // and can freely check ODR violation with the first method.
191 //
192 // This routine chooses between two different methods of ODR violation
193 // detection.
UseODRIndicator(const Global * g)194 static inline bool UseODRIndicator(const Global *g) {
195 return g->odr_indicator > 0;
196 }
197
198 // Register a global variable.
199 // This function may be called more than once for every global
200 // so we store the globals in a map.
RegisterGlobal(const Global * g)201 static void RegisterGlobal(const Global *g) {
202 CHECK(AsanInited());
203 if (flags()->report_globals >= 2)
204 ReportGlobal(*g, "Added");
205 CHECK(flags()->report_globals);
206 CHECK(AddrIsInMem(g->beg));
207 if (!AddrIsAlignedByGranularity(g->beg)) {
208 Report("The following global variable is not properly aligned.\n");
209 Report("This may happen if another global with the same name\n");
210 Report("resides in another non-instrumented module.\n");
211 Report("Or the global comes from a C file built w/o -fno-common.\n");
212 Report("In either case this is likely an ODR violation bug,\n");
213 Report("but AddressSanitizer can not provide more details.\n");
214 ReportODRViolation(g, FindRegistrationSite(g), g, FindRegistrationSite(g));
215 CHECK(AddrIsAlignedByGranularity(g->beg));
216 }
217 CHECK(AddrIsAlignedByGranularity(g->size_with_redzone));
218 if (flags()->detect_odr_violation) {
219 // Try detecting ODR (One Definition Rule) violation, i.e. the situation
220 // where two globals with the same name are defined in different modules.
221 if (UseODRIndicator(g))
222 CheckODRViolationViaIndicator(g);
223 else
224 CheckODRViolationViaPoisoning(g);
225 }
226 if (CanPoisonMemory())
227 PoisonRedZones(*g);
228 ListOfGlobals *l = new (GetGlobalLowLevelAllocator()) ListOfGlobals;
229 l->g = g;
230 l->next = list_of_all_globals;
231 list_of_all_globals = l;
232 if (g->has_dynamic_init) {
233 if (!dynamic_init_globals) {
234 dynamic_init_globals = new (GetGlobalLowLevelAllocator()) VectorOfGlobals;
235 dynamic_init_globals->reserve(kDynamicInitGlobalsInitialCapacity);
236 }
237 DynInitGlobal dyn_global = { *g, false };
238 dynamic_init_globals->push_back(dyn_global);
239 }
240 }
241
UnregisterGlobal(const Global * g)242 static void UnregisterGlobal(const Global *g) {
243 CHECK(AsanInited());
244 if (flags()->report_globals >= 2)
245 ReportGlobal(*g, "Removed");
246 CHECK(flags()->report_globals);
247 CHECK(AddrIsInMem(g->beg));
248 CHECK(AddrIsAlignedByGranularity(g->beg));
249 CHECK(AddrIsAlignedByGranularity(g->size_with_redzone));
250 if (CanPoisonMemory())
251 PoisonShadowForGlobal(g, 0);
252 // We unpoison the shadow memory for the global but we do not remove it from
253 // the list because that would require O(n^2) time with the current list
254 // implementation. It might not be worth doing anyway.
255
256 // Release ODR indicator.
257 if (UseODRIndicator(g) && g->odr_indicator != UINTPTR_MAX) {
258 u8 *odr_indicator = reinterpret_cast<u8 *>(g->odr_indicator);
259 *odr_indicator = UNREGISTERED;
260 }
261 }
262
StopInitOrderChecking()263 void StopInitOrderChecking() {
264 Lock lock(&mu_for_globals);
265 if (!flags()->check_initialization_order || !dynamic_init_globals)
266 return;
267 flags()->check_initialization_order = false;
268 for (uptr i = 0, n = dynamic_init_globals->size(); i < n; ++i) {
269 DynInitGlobal &dyn_g = (*dynamic_init_globals)[i];
270 const Global *g = &dyn_g.g;
271 // Unpoison the whole global.
272 PoisonShadowForGlobal(g, 0);
273 // Poison redzones back.
274 PoisonRedZones(*g);
275 }
276 }
277
// Returns true when `c` is in the 7-bit ASCII range [0x00, 0x7F].
static bool IsASCII(unsigned char c) { return c < 0x80; }
279
MaybeDemangleGlobalName(const char * name)280 const char *MaybeDemangleGlobalName(const char *name) {
281 // We can spoil names of globals with C linkage, so use an heuristic
282 // approach to check if the name should be demangled.
283 bool should_demangle = false;
284 if (name[0] == '_' && name[1] == 'Z')
285 should_demangle = true;
286 else if (SANITIZER_WINDOWS && name[0] == '\01' && name[1] == '?')
287 should_demangle = true;
288
289 return should_demangle ? Symbolizer::GetOrInit()->Demangle(name) : name;
290 }
291
292 // Check if the global is a zero-terminated ASCII string. If so, print it.
PrintGlobalNameIfASCII(InternalScopedString * str,const __asan_global & g)293 void PrintGlobalNameIfASCII(InternalScopedString *str, const __asan_global &g) {
294 for (uptr p = g.beg; p < g.beg + g.size - 1; p++) {
295 unsigned char c = *(unsigned char *)p;
296 if (c == '\0' || !IsASCII(c)) return;
297 }
298 if (*(char *)(g.beg + g.size - 1) != '\0') return;
299 str->AppendF(" '%s' is ascii string '%s'\n", MaybeDemangleGlobalName(g.name),
300 (char *)g.beg);
301 }
302
PrintGlobalLocation(InternalScopedString * str,const __asan_global & g,bool print_module_name)303 void PrintGlobalLocation(InternalScopedString *str, const __asan_global &g,
304 bool print_module_name) {
305 DataInfo info;
306 if (Symbolizer::GetOrInit()->SymbolizeData(g.beg, &info) && info.line != 0) {
307 str->AppendF("%s:%d", info.file, static_cast<int>(info.line));
308 } else if (g.gcc_location != 0) {
309 // Fallback to Global::gcc_location
310 str->AppendF("%s", g.gcc_location->filename ? g.gcc_location->filename
311 : g.module_name);
312 if (g.gcc_location->line_no)
313 str->AppendF(":%d", g.gcc_location->line_no);
314 if (g.gcc_location->column_no)
315 str->AppendF(":%d", g.gcc_location->column_no);
316 } else {
317 str->AppendF("%s", g.module_name);
318 }
319 if (print_module_name && info.module)
320 str->AppendF(" in %s", info.module);
321 }
322
323 } // namespace __asan
324
325 // ---------------------- Interface ---------------- {{{1
326 using namespace __asan;
327
328 // Apply __asan_register_globals to all globals found in the same loaded
329 // executable or shared library as `flag'. The flag tracks whether globals have
330 // already been registered or not for this image.
__asan_register_image_globals(uptr * flag)331 void __asan_register_image_globals(uptr *flag) {
332 if (*flag)
333 return;
334 AsanApplyToGlobals(__asan_register_globals, flag);
335 *flag = 1;
336 }
337
338 // This mirrors __asan_register_image_globals.
__asan_unregister_image_globals(uptr * flag)339 void __asan_unregister_image_globals(uptr *flag) {
340 if (!*flag)
341 return;
342 AsanApplyToGlobals(__asan_unregister_globals, flag);
343 *flag = 0;
344 }
345
__asan_register_elf_globals(uptr * flag,void * start,void * stop)346 void __asan_register_elf_globals(uptr *flag, void *start, void *stop) {
347 if (*flag || start == stop)
348 return;
349 CHECK_EQ(0, ((uptr)stop - (uptr)start) % sizeof(__asan_global));
350 __asan_global *globals_start = (__asan_global*)start;
351 __asan_global *globals_stop = (__asan_global*)stop;
352 __asan_register_globals(globals_start, globals_stop - globals_start);
353 *flag = 1;
354 }
355
__asan_unregister_elf_globals(uptr * flag,void * start,void * stop)356 void __asan_unregister_elf_globals(uptr *flag, void *start, void *stop) {
357 if (!*flag || start == stop)
358 return;
359 CHECK_EQ(0, ((uptr)stop - (uptr)start) % sizeof(__asan_global));
360 __asan_global *globals_start = (__asan_global*)start;
361 __asan_global *globals_stop = (__asan_global*)stop;
362 __asan_unregister_globals(globals_start, globals_stop - globals_start);
363 *flag = 0;
364 }
365
366 // Register an array of globals.
__asan_register_globals(__asan_global * globals,uptr n)367 void __asan_register_globals(__asan_global *globals, uptr n) {
368 if (!flags()->report_globals) return;
369 GET_STACK_TRACE_MALLOC;
370 u32 stack_id = StackDepotPut(stack);
371 Lock lock(&mu_for_globals);
372 if (!global_registration_site_vector) {
373 global_registration_site_vector =
374 new (GetGlobalLowLevelAllocator()) GlobalRegistrationSiteVector;
375 global_registration_site_vector->reserve(128);
376 }
377 GlobalRegistrationSite site = {stack_id, &globals[0], &globals[n - 1]};
378 global_registration_site_vector->push_back(site);
379 if (flags()->report_globals >= 2) {
380 PRINT_CURRENT_STACK();
381 Printf("=== ID %d; %p %p\n", stack_id, (void *)&globals[0],
382 (void *)&globals[n - 1]);
383 }
384 for (uptr i = 0; i < n; i++) {
385 if (SANITIZER_WINDOWS && globals[i].beg == 0) {
386 // The MSVC incremental linker may pad globals out to 256 bytes. As long
387 // as __asan_global is less than 256 bytes large and its size is a power
388 // of two, we can skip over the padding.
389 static_assert(
390 sizeof(__asan_global) < 256 &&
391 (sizeof(__asan_global) & (sizeof(__asan_global) - 1)) == 0,
392 "sizeof(__asan_global) incompatible with incremental linker padding");
393 // If these are padding bytes, the rest of the global should be zero.
394 CHECK(globals[i].size == 0 && globals[i].size_with_redzone == 0 &&
395 globals[i].name == nullptr && globals[i].module_name == nullptr &&
396 globals[i].odr_indicator == 0);
397 continue;
398 }
399 RegisterGlobal(&globals[i]);
400 }
401
402 // Poison the metadata. It should not be accessible to user code.
403 PoisonShadow(reinterpret_cast<uptr>(globals), n * sizeof(__asan_global),
404 kAsanGlobalRedzoneMagic);
405 }
406
407 // Unregister an array of globals.
408 // We must do this when a shared objects gets dlclosed.
__asan_unregister_globals(__asan_global * globals,uptr n)409 void __asan_unregister_globals(__asan_global *globals, uptr n) {
410 if (!flags()->report_globals) return;
411 Lock lock(&mu_for_globals);
412 for (uptr i = 0; i < n; i++) {
413 if (SANITIZER_WINDOWS && globals[i].beg == 0) {
414 // Skip globals that look like padding from the MSVC incremental linker.
415 // See comment in __asan_register_globals.
416 continue;
417 }
418 UnregisterGlobal(&globals[i]);
419 }
420
421 // Unpoison the metadata.
422 PoisonShadow(reinterpret_cast<uptr>(globals), n * sizeof(__asan_global), 0);
423 }
424
425 // This method runs immediately prior to dynamic initialization in each TU,
426 // when all dynamically initialized globals are unpoisoned. This method
427 // poisons all global variables not defined in this TU, so that a dynamic
428 // initializer can only touch global variables in the same TU.
__asan_before_dynamic_init(const char * module_name)429 void __asan_before_dynamic_init(const char *module_name) {
430 if (!flags()->check_initialization_order ||
431 !CanPoisonMemory() ||
432 !dynamic_init_globals)
433 return;
434 bool strict_init_order = flags()->strict_init_order;
435 CHECK(module_name);
436 CHECK(AsanInited());
437 Lock lock(&mu_for_globals);
438 if (flags()->report_globals >= 3)
439 Printf("DynInitPoison module: %s\n", module_name);
440 for (uptr i = 0, n = dynamic_init_globals->size(); i < n; ++i) {
441 DynInitGlobal &dyn_g = (*dynamic_init_globals)[i];
442 const Global *g = &dyn_g.g;
443 if (dyn_g.initialized)
444 continue;
445 if (g->module_name != module_name)
446 PoisonShadowForGlobal(g, kAsanInitializationOrderMagic);
447 else if (!strict_init_order)
448 dyn_g.initialized = true;
449 }
450 }
451
452 // This method runs immediately after dynamic initialization in each TU, when
453 // all dynamically initialized globals except for those defined in the current
454 // TU are poisoned. It simply unpoisons all dynamically initialized globals.
__asan_after_dynamic_init()455 void __asan_after_dynamic_init() {
456 if (!flags()->check_initialization_order ||
457 !CanPoisonMemory() ||
458 !dynamic_init_globals)
459 return;
460 CHECK(AsanInited());
461 Lock lock(&mu_for_globals);
462 // FIXME: Optionally report that we're unpoisoning globals from a module.
463 for (uptr i = 0, n = dynamic_init_globals->size(); i < n; ++i) {
464 DynInitGlobal &dyn_g = (*dynamic_init_globals)[i];
465 const Global *g = &dyn_g.g;
466 if (!dyn_g.initialized) {
467 // Unpoison the whole global.
468 PoisonShadowForGlobal(g, 0);
469 // Poison redzones back.
470 PoisonRedZones(*g);
471 }
472 }
473 }
474