xref: /freebsd/contrib/llvm-project/llvm/lib/Support/CrashRecoveryContext.cpp (revision 2a0c0aea42092f89c2a5345991e6e3ce4cbef99a)
1 //===--- CrashRecoveryContext.cpp - Crash Recovery ------------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 
9 #include "llvm/Support/CrashRecoveryContext.h"
10 #include "llvm/Config/llvm-config.h"
11 #include "llvm/Support/ErrorHandling.h"
12 #include "llvm/Support/ExitCodes.h"
13 #include "llvm/Support/Signals.h"
14 #include "llvm/Support/thread.h"
15 #include <cassert>
16 #include <mutex>
17 #include <setjmp.h>
18 
19 using namespace llvm;
20 
21 namespace {
22 
// Forward declaration so that the pointer below can refer to the
// implementation type before its definition.
struct CrashRecoveryContextImpl;
// The most recently constructed CrashRecoveryContextImpl that is still active
// (the head of the chain formed through CrashRecoveryContextImpl::Next), or
// null when there is none. Declared with LLVM_THREAD_LOCAL.
static LLVM_THREAD_LOCAL const CrashRecoveryContextImpl *CurrentContext;
25 
26 struct CrashRecoveryContextImpl {
27   // When threads are disabled, this links up all active
28   // CrashRecoveryContextImpls.  When threads are enabled there's one thread
29   // per CrashRecoveryContext and CurrentContext is a thread-local, so only one
30   // CrashRecoveryContextImpl is active per thread and this is always null.
31   const CrashRecoveryContextImpl *Next;
32 
33   CrashRecoveryContext *CRC;
34   ::jmp_buf JumpBuffer;
35   volatile unsigned Failed : 1;
36   unsigned SwitchedThread : 1;
37   unsigned ValidJumpBuffer : 1;
38 
39 public:
40   CrashRecoveryContextImpl(CrashRecoveryContext *CRC) noexcept
41       : CRC(CRC), Failed(false), SwitchedThread(false), ValidJumpBuffer(false) {
42     Next = CurrentContext;
43     CurrentContext = this;
44   }
45   ~CrashRecoveryContextImpl() {
46     if (!SwitchedThread)
47       CurrentContext = Next;
48   }
49 
50   /// Called when the separate crash-recovery thread was finished, to
51   /// indicate that we don't need to clear the thread-local CurrentContext.
52   void setSwitchedThread() {
53 #if defined(LLVM_ENABLE_THREADS) && LLVM_ENABLE_THREADS != 0
54     SwitchedThread = true;
55 #endif
56   }
57 
58   // If the function ran by the CrashRecoveryContext crashes or fails, then
59   // 'RetCode' represents the returned error code, as if it was returned by a
60   // process. 'Context' represents the signal type on Unix; on Windows, it is
61   // the ExceptionContext.
62   void HandleCrash(int RetCode, uintptr_t Context) {
63     // Eliminate the current context entry, to avoid re-entering in case the
64     // cleanup code crashes.
65     CurrentContext = Next;
66 
67     assert(!Failed && "Crash recovery context already failed!");
68     Failed = true;
69 
70     if (CRC->DumpStackAndCleanupOnFailure)
71       sys::CleanupOnSignal(Context);
72 
73     CRC->RetCode = RetCode;
74 
75     // Jump back to the RunSafely we were called under.
76     if (ValidJumpBuffer)
77       longjmp(JumpBuffer, 1);
78 
79     // Otherwise let the caller decide of the outcome of the crash. Currently
80     // this occurs when using SEH on Windows with MSVC or clang-cl.
81   }
82 };
83 
/// Returns the single mutex that CrashRecoveryContext::Enable() and
/// CrashRecoveryContext::Disable() lock. It is a function-local static, so it
/// is constructed the first time this function is called.
std::mutex &getCrashRecoveryContextMutex() {
  static std::mutex EnableDisableMutex;
  return EnableDisableMutex;
}
88 
// True between CrashRecoveryContext::Enable() and
// CrashRecoveryContext::Disable(); both write it while holding
// getCrashRecoveryContextMutex().
static bool gCrashRecoveryEnabled = false;

// Points at the CrashRecoveryContext whose destructor is currently running
// its registered cleanups, and is restored to its previous value afterwards.
// CrashRecoveryContext::isRecoveringFromCrash() reports whether it is
// non-null.
static LLVM_THREAD_LOCAL const CrashRecoveryContext *IsRecoveringFromCrash;
92 
93 } // namespace
94 
// Platform-specific hooks, defined below once per supported configuration.
// CrashRecoveryContext::Enable() calls the first and
// CrashRecoveryContext::Disable() calls the second.
static void installExceptionOrSignalHandlers();
static void uninstallExceptionOrSignalHandlers();
97 
// Out-of-line definition of the (defaulted) destructor.
CrashRecoveryContextCleanup::~CrashRecoveryContextCleanup() = default;
99 
100 CrashRecoveryContext::CrashRecoveryContext() {
101   // On Windows, if abort() was previously triggered (and caught by a previous
102   // CrashRecoveryContext) the Windows CRT removes our installed signal handler,
103   // so we need to install it again.
104   sys::DisableSystemDialogsOnCrash();
105 }
106 
107 CrashRecoveryContext::~CrashRecoveryContext() {
108   // Reclaim registered resources.
109   CrashRecoveryContextCleanup *i = head;
110   const CrashRecoveryContext *PC = IsRecoveringFromCrash;
111   IsRecoveringFromCrash = this;
112   while (i) {
113     CrashRecoveryContextCleanup *tmp = i;
114     i = tmp->next;
115     tmp->cleanupFired = true;
116     tmp->recoverResources();
117     delete tmp;
118   }
119   IsRecoveringFromCrash = PC;
120 
121   CrashRecoveryContextImpl *CRCI = (CrashRecoveryContextImpl *) Impl;
122   delete CRCI;
123 }
124 
125 bool CrashRecoveryContext::isRecoveringFromCrash() {
126   return IsRecoveringFromCrash != nullptr;
127 }
128 
129 CrashRecoveryContext *CrashRecoveryContext::GetCurrent() {
130   if (!gCrashRecoveryEnabled)
131     return nullptr;
132 
133   const CrashRecoveryContextImpl *CRCI = CurrentContext;
134   if (!CRCI)
135     return nullptr;
136 
137   return CRCI->CRC;
138 }
139 
140 void CrashRecoveryContext::Enable() {
141   std::lock_guard<std::mutex> L(getCrashRecoveryContextMutex());
142   // FIXME: Shouldn't this be a refcount or something?
143   if (gCrashRecoveryEnabled)
144     return;
145   gCrashRecoveryEnabled = true;
146   installExceptionOrSignalHandlers();
147 }
148 
149 void CrashRecoveryContext::Disable() {
150   std::lock_guard<std::mutex> L(getCrashRecoveryContextMutex());
151   if (!gCrashRecoveryEnabled)
152     return;
153   gCrashRecoveryEnabled = false;
154   uninstallExceptionOrSignalHandlers();
155 }
156 
157 void CrashRecoveryContext::registerCleanup(CrashRecoveryContextCleanup *cleanup)
158 {
159   if (!cleanup)
160     return;
161   if (head)
162     head->prev = cleanup;
163   cleanup->next = head;
164   head = cleanup;
165 }
166 
167 void
168 CrashRecoveryContext::unregisterCleanup(CrashRecoveryContextCleanup *cleanup) {
169   if (!cleanup)
170     return;
171   if (cleanup == head) {
172     head = cleanup->next;
173     if (head)
174       head->prev = nullptr;
175   }
176   else {
177     cleanup->prev->next = cleanup->next;
178     if (cleanup->next)
179       cleanup->next->prev = cleanup->prev;
180   }
181   delete cleanup;
182 }
183 
184 #if defined(_MSC_VER)
185 
186 #include <windows.h> // for GetExceptionInformation
187 
188 // If _MSC_VER is defined, we must have SEH. Use it if it's available. It's way
189 // better than VEH. Vectored exception handling catches all exceptions happening
190 // on the thread with installed exception handlers, so it can interfere with
191 // internal exception handling of other libraries on that thread. SEH works
192 // exactly as you would expect normal exception handling to work: it only
193 // catches exceptions if they would bubble out from the stack frame with __try /
194 // __except.
195 
// Nothing to install or remove in the SEH configuration: the crash is caught
// by the __try / __except in RunSafely below, so both hooks are empty.
static void installExceptionOrSignalHandlers() {}
static void uninstallExceptionOrSignalHandlers() {}
198 
199 // We need this function because the call to GetExceptionInformation() can only
200 // occur inside the __except evaluation block
201 static int ExceptionFilter(_EXCEPTION_POINTERS *Except) {
202   // Lookup the current thread local recovery object.
203   const CrashRecoveryContextImpl *CRCI = CurrentContext;
204 
205   if (!CRCI) {
206     // Something has gone horribly wrong, so let's just tell everyone
207     // to keep searching
208     CrashRecoveryContext::Disable();
209     return EXCEPTION_CONTINUE_SEARCH;
210   }
211 
212   int RetCode = (int)Except->ExceptionRecord->ExceptionCode;
213   if ((RetCode & 0xF0000000) == 0xE0000000)
214     RetCode &= ~0xF0000000; // this crash was generated by sys::Process::Exit
215 
216   // Handle the crash
217   const_cast<CrashRecoveryContextImpl *>(CRCI)->HandleCrash(
218       RetCode, reinterpret_cast<uintptr_t>(Except));
219 
220   return EXCEPTION_EXECUTE_HANDLER;
221 }
222 
// SEH flavour of RunSafely.
//
// Runs Fn and returns true if it completed. When crash recovery is enabled,
// Fn runs inside __try / __except with ExceptionFilter as the filter; if the
// filter selects the handler, false is returned instead. When crash recovery
// is disabled, Fn is simply called with no protection.
#if defined(__clang__) && defined(_M_IX86)
// Work around PR44697.
__attribute__((optnone))
#endif
bool CrashRecoveryContext::RunSafely(function_ref<void()> Fn) {
  if (!gCrashRecoveryEnabled) {
    Fn();
    return true;
  }
  assert(!Impl && "Crash recovery context already initialized!");
  // Constructing the implementation makes it the current context, which is
  // how ExceptionFilter finds it. It is freed by ~CrashRecoveryContext().
  Impl = new CrashRecoveryContextImpl(this);
  __try {
    Fn();
  } __except (ExceptionFilter(GetExceptionInformation())) {
    return false;
  }
  return true;
}
241 
242 #else // !_MSC_VER
243 
244 #if defined(_WIN32)
245 // This is a non-MSVC compiler, probably mingw gcc or clang without
246 // -fms-extensions. Use vectored exception handling (VEH).
247 //
248 // On Windows, we can make use of vectored exception handling to catch most
249 // crashing situations.  Note that this does mean we will be alerted of
250 // exceptions *before* structured exception handling has the opportunity to
251 // catch it. Unfortunately, this causes problems in practice with other code
252 // running on threads with LLVM crash recovery contexts, so we would like to
253 // eventually move away from VEH.
254 //
255 // Vectored works on a per-thread basis, which is an advantage over
256 // SetUnhandledExceptionFilter. SetUnhandledExceptionFilter also doesn't have
257 // any native support for chaining exception handlers, but VEH allows more than
258 // one.
259 //
260 // The vectored exception handler functionality was added in Windows
261 // XP, so if support for older versions of Windows is required,
262 // it will have to be added.
263 
264 #include "llvm/Support/Windows/WindowsSupport.h"
265 
266 static LONG CALLBACK ExceptionHandler(PEXCEPTION_POINTERS ExceptionInfo)
267 {
268   // DBG_PRINTEXCEPTION_WIDE_C is not properly defined on all supported
269   // compilers and platforms, so we define it manually.
270   constexpr ULONG DbgPrintExceptionWideC = 0x4001000AL;
271   switch (ExceptionInfo->ExceptionRecord->ExceptionCode)
272   {
273   case DBG_PRINTEXCEPTION_C:
274   case DbgPrintExceptionWideC:
275   case 0x406D1388:  // set debugger thread name
276     return EXCEPTION_CONTINUE_EXECUTION;
277   }
278 
279   // Lookup the current thread local recovery object.
280   const CrashRecoveryContextImpl *CRCI = CurrentContext;
281 
282   if (!CRCI) {
283     // Something has gone horribly wrong, so let's just tell everyone
284     // to keep searching
285     CrashRecoveryContext::Disable();
286     return EXCEPTION_CONTINUE_SEARCH;
287   }
288 
289   // TODO: We can capture the stack backtrace here and store it on the
290   // implementation if we so choose.
291 
292   int RetCode = (int)ExceptionInfo->ExceptionRecord->ExceptionCode;
293   if ((RetCode & 0xF0000000) == 0xE0000000)
294     RetCode &= ~0xF0000000; // this crash was generated by sys::Process::Exit
295 
296   // Handle the crash
297   const_cast<CrashRecoveryContextImpl *>(CRCI)->HandleCrash(
298       RetCode, reinterpret_cast<uintptr_t>(ExceptionInfo));
299 
300   // Note that we don't actually get here because HandleCrash calls
301   // longjmp, which means the HandleCrash function never returns.
302   llvm_unreachable("Handled the crash, should have longjmp'ed out of here");
303 }
304 
305 // Because the Enable and Disable calls are static, it means that
306 // there may not actually be an Impl available, or even a current
307 // CrashRecoveryContext at all.  So we make use of a thread-local
308 // exception table.  The handles contained in here will either be
309 // non-NULL, valid VEH handles, or NULL.
310 static LLVM_THREAD_LOCAL const void* sCurrentExceptionHandle;
311 
312 static void installExceptionOrSignalHandlers() {
313   // We can set up vectored exception handling now.  We will install our
314   // handler as the front of the list, though there's no assurances that
315   // it will remain at the front (another call could install itself before
316   // our handler).  This 1) isn't likely, and 2) shouldn't cause problems.
317   PVOID handle = ::AddVectoredExceptionHandler(1, ExceptionHandler);
318   sCurrentExceptionHandle = handle;
319 }
320 
321 static void uninstallExceptionOrSignalHandlers() {
322   PVOID currentHandle = const_cast<PVOID>(sCurrentExceptionHandle);
323   if (currentHandle) {
324     // Now we can remove the vectored exception handler from the chain
325     ::RemoveVectoredExceptionHandler(currentHandle);
326 
327     // Reset the handle in our thread-local set.
328     sCurrentExceptionHandle = NULL;
329   }
330 }
331 
332 #else // !_WIN32
333 
334 // Generic POSIX implementation.
335 //
336 // This implementation relies on synchronous signals being delivered to the
337 // current thread. We use a thread local object to keep track of the active
338 // crash recovery context, and install signal handlers to invoke HandleCrash on
339 // the active object.
340 //
341 // This implementation does not attempt to chain signal handlers in any
342 // reliable fashion -- if we get a signal outside of a crash recovery context we
343 // simply disable crash recovery and raise the signal again.
344 
345 #include <signal.h>
346 
// The signals for which installExceptionOrSignalHandlers() installs
// CrashRecoverySignalHandler.
static const int Signals[] =
    { SIGABRT, SIGBUS, SIGFPE, SIGILL, SIGSEGV, SIGTRAP };
// Number of entries in Signals.
static const unsigned NumSignals = std::size(Signals);
// The signal actions that were in effect before ours were installed, indexed
// in parallel with Signals; uninstallExceptionOrSignalHandlers() restores
// them.
static struct sigaction PrevActions[NumSignals];
351 
352 static void CrashRecoverySignalHandler(int Signal) {
353   // Lookup the current thread local recovery object.
354   const CrashRecoveryContextImpl *CRCI = CurrentContext;
355 
356   if (!CRCI) {
357     // We didn't find a crash recovery context -- this means either we got a
358     // signal on a thread we didn't expect it on, the application got a signal
359     // outside of a crash recovery context, or something else went horribly
360     // wrong.
361     //
362     // Disable crash recovery and raise the signal again. The assumption here is
363     // that the enclosing application will terminate soon, and we won't want to
364     // attempt crash recovery again.
365     //
366     // This call of Disable isn't thread safe, but it doesn't actually matter.
367     CrashRecoveryContext::Disable();
368     raise(Signal);
369 
370     // The signal will be thrown once the signal mask is restored.
371     return;
372   }
373 
374   // Unblock the signal we received.
375   sigset_t SigMask;
376   sigemptyset(&SigMask);
377   sigaddset(&SigMask, Signal);
378   sigprocmask(SIG_UNBLOCK, &SigMask, nullptr);
379 
380   // Return the same error code as if the program crashed, as mentioned in the
381   // section "Exit Status for Commands":
382   // https://pubs.opengroup.org/onlinepubs/9699919799/xrat/V4_xcu_chap02.html
383   int RetCode = 128 + Signal;
384 
385   // Don't consider a broken pipe as a crash (see clang/lib/Driver/Driver.cpp)
386   if (Signal == SIGPIPE)
387     RetCode = EX_IOERR;
388 
389   if (CRCI)
390     const_cast<CrashRecoveryContextImpl *>(CRCI)->HandleCrash(RetCode, Signal);
391 }
392 
393 static void installExceptionOrSignalHandlers() {
394   // Setup the signal handler.
395   struct sigaction Handler;
396   Handler.sa_handler = CrashRecoverySignalHandler;
397   Handler.sa_flags = 0;
398   sigemptyset(&Handler.sa_mask);
399 
400   for (unsigned i = 0; i != NumSignals; ++i) {
401     sigaction(Signals[i], &Handler, &PrevActions[i]);
402   }
403 }
404 
405 static void uninstallExceptionOrSignalHandlers() {
406   // Restore the previous signal handlers.
407   for (unsigned i = 0; i != NumSignals; ++i)
408     sigaction(Signals[i], &PrevActions[i], nullptr);
409 }
410 
411 #endif // !_WIN32
412 
413 bool CrashRecoveryContext::RunSafely(function_ref<void()> Fn) {
414   // If crash recovery is disabled, do nothing.
415   if (gCrashRecoveryEnabled) {
416     assert(!Impl && "Crash recovery context already initialized!");
417     CrashRecoveryContextImpl *CRCI = new CrashRecoveryContextImpl(this);
418     Impl = CRCI;
419 
420     CRCI->ValidJumpBuffer = true;
421     if (setjmp(CRCI->JumpBuffer) != 0) {
422       return false;
423     }
424   }
425 
426   Fn();
427   return true;
428 }
429 
430 #endif // !_MSC_VER
431 
432 [[noreturn]] void CrashRecoveryContext::HandleExit(int RetCode) {
433 #if defined(_WIN32)
434   // SEH and VEH
435   ::RaiseException(0xE0000000 | RetCode, 0, 0, NULL);
436 #else
437   // On Unix we don't need to raise an exception, we go directly to
438   // HandleCrash(), then longjmp will unwind the stack for us.
439   CrashRecoveryContextImpl *CRCI = (CrashRecoveryContextImpl *)Impl;
440   assert(CRCI && "Crash recovery context never initialized!");
441   CRCI->HandleCrash(RetCode, 0 /*no sig num*/);
442 #endif
443   llvm_unreachable("Most likely setjmp wasn't called!");
444 }
445 
446 bool CrashRecoveryContext::isCrash(int RetCode) {
447 #if defined(_WIN32)
448   // On Windows, the high bits are reserved for kernel return codes. Values
449   // starting with 0x80000000 are reserved for "warnings"; values of 0xC0000000
450   // and up are for "errors". In practice, both are interpreted as a
451   // non-continuable signal.
452   unsigned Code = ((unsigned)RetCode & 0xF0000000) >> 28;
453   if (Code != 0xC && Code != 8)
454     return false;
455 #else
456   // On Unix, signals are represented by return codes of 128 or higher.
457   // Exit code 128 is a reserved value and should not be raised as a signal.
458   if (RetCode <= 128)
459     return false;
460 #endif
461   return true;
462 }
463 
464 bool CrashRecoveryContext::throwIfCrash(int RetCode) {
465   if (!isCrash(RetCode))
466     return false;
467 #if defined(_WIN32)
468   ::RaiseException(RetCode, 0, 0, NULL);
469 #else
470   llvm::sys::unregisterHandlers();
471   raise(RetCode - 128);
472 #endif
473   return true;
474 }
475 
// Requests background priority for the calling thread. Only implemented on
// Apple platforms; a no-op everywhere else.
// FIXME: Portability.
static void setThreadBackgroundPriority() {
#if defined(__APPLE__)
  setpriority(PRIO_DARWIN_THREAD, 0, PRIO_DARWIN_BG);
#endif
}
482 
// Reports whether the calling thread currently has background priority. Only
// implemented on Apple platforms, where the Darwin thread priority is
// compared against 1; always false everywhere else.
static bool hasThreadBackgroundPriority() {
#if defined(__APPLE__)
  const int DarwinThreadPriority = getpriority(PRIO_DARWIN_THREAD, 0);
  return DarwinThreadPriority == 1;
#else
  return false;
#endif
}
490 
namespace {
// Arguments and result slot that RunSafelyOnThread passes to
// RunSafelyOnThread_Dispatch through its void* parameter.
struct RunSafelyOnThreadInfo {
  // The callable handed on to CRC->RunSafely().
  function_ref<void()> Fn;
  // The context whose RunSafely() is invoked on the worker thread.
  CrashRecoveryContext *CRC;
  // When set, the worker calls setThreadBackgroundPriority() before running.
  bool UseBackgroundPriority;
  // Receives the value returned by RunSafely().
  bool Result;
};
} // namespace
499 
500 static void RunSafelyOnThread_Dispatch(void *UserData) {
501   RunSafelyOnThreadInfo *Info =
502     reinterpret_cast<RunSafelyOnThreadInfo*>(UserData);
503 
504   if (Info->UseBackgroundPriority)
505     setThreadBackgroundPriority();
506 
507   Info->Result = Info->CRC->RunSafely(Info->Fn);
508 }
509 bool CrashRecoveryContext::RunSafelyOnThread(function_ref<void()> Fn,
510                                              unsigned RequestedStackSize) {
511   bool UseBackgroundPriority = hasThreadBackgroundPriority();
512   RunSafelyOnThreadInfo Info = { Fn, this, UseBackgroundPriority, false };
513   llvm::thread Thread(RequestedStackSize == 0
514                           ? std::nullopt
515                           : std::optional<unsigned>(RequestedStackSize),
516                       RunSafelyOnThread_Dispatch, &Info);
517   Thread.join();
518 
519   if (CrashRecoveryContextImpl *CRC = (CrashRecoveryContextImpl *)Impl)
520     CRC->setSwitchedThread();
521   return Info.Result;
522 }
523