xref: /freebsd/contrib/llvm-project/llvm/lib/CodeGen/StackProtector.cpp (revision 1db9f3b21e39176dd5b67cf8ac378633b172463e)
1 //===- StackProtector.cpp - Stack Protector Insertion ---------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This pass inserts stack protectors into functions which need them. A variable
10 // with a random value in it is stored onto the stack before the local variables
11 // are allocated. Upon exiting the block, the stored value is checked. If it's
12 // changed, then there was some sort of violation and the program aborts.
13 //
14 //===----------------------------------------------------------------------===//
15 
16 #include "llvm/CodeGen/StackProtector.h"
17 #include "llvm/ADT/SmallPtrSet.h"
18 #include "llvm/ADT/SmallVector.h"
19 #include "llvm/ADT/Statistic.h"
20 #include "llvm/Analysis/BranchProbabilityInfo.h"
21 #include "llvm/Analysis/MemoryLocation.h"
22 #include "llvm/Analysis/OptimizationRemarkEmitter.h"
23 #include "llvm/CodeGen/Passes.h"
24 #include "llvm/CodeGen/TargetLowering.h"
25 #include "llvm/CodeGen/TargetPassConfig.h"
26 #include "llvm/CodeGen/TargetSubtargetInfo.h"
27 #include "llvm/IR/Attributes.h"
28 #include "llvm/IR/BasicBlock.h"
29 #include "llvm/IR/Constants.h"
30 #include "llvm/IR/DataLayout.h"
31 #include "llvm/IR/DerivedTypes.h"
32 #include "llvm/IR/Dominators.h"
33 #include "llvm/IR/EHPersonalities.h"
34 #include "llvm/IR/Function.h"
35 #include "llvm/IR/IRBuilder.h"
36 #include "llvm/IR/Instruction.h"
37 #include "llvm/IR/Instructions.h"
38 #include "llvm/IR/IntrinsicInst.h"
39 #include "llvm/IR/Intrinsics.h"
40 #include "llvm/IR/MDBuilder.h"
41 #include "llvm/IR/Module.h"
42 #include "llvm/IR/Type.h"
43 #include "llvm/IR/User.h"
44 #include "llvm/InitializePasses.h"
45 #include "llvm/Pass.h"
46 #include "llvm/Support/Casting.h"
47 #include "llvm/Support/CommandLine.h"
48 #include "llvm/Target/TargetMachine.h"
49 #include "llvm/Target/TargetOptions.h"
50 #include "llvm/Transforms/Utils/BasicBlockUtils.h"
51 #include <optional>
52 #include <utility>
53 
54 using namespace llvm;
55 
56 #define DEBUG_TYPE "stack-protector"
57 
58 STATISTIC(NumFunProtected, "Number of functions protected");
59 STATISTIC(NumAddrTaken, "Number of local variables that have their address"
60                         " taken.");
61 
62 static cl::opt<bool> EnableSelectionDAGSP("enable-selectiondag-sp",
63                                           cl::init(true), cl::Hidden);
64 static cl::opt<bool> DisableCheckNoReturn("disable-check-noreturn-call",
65                                           cl::init(false), cl::Hidden);
66 
67 /// InsertStackProtectors - Insert code into the prologue and epilogue of the
68 /// function.
69 ///
70 ///  - The prologue code loads and stores the stack guard onto the stack.
71 ///  - The epilogue checks the value stored in the prologue against the original
72 ///    value. It calls __stack_chk_fail if they differ.
73 static bool InsertStackProtectors(const TargetMachine *TM, Function *F,
74                                   DomTreeUpdater *DTU, bool &HasPrologue,
75                                   bool &HasIRCheck);
76 
77 /// CreateFailBB - Create a basic block to jump to when the stack protector
78 /// check fails.
79 static BasicBlock *CreateFailBB(Function *F, const Triple &Trip);
80 
81 bool SSPLayoutInfo::shouldEmitSDCheck(const BasicBlock &BB) const {
82   return HasPrologue && !HasIRCheck && isa<ReturnInst>(BB.getTerminator());
83 }
84 
85 void SSPLayoutInfo::copyToMachineFrameInfo(MachineFrameInfo &MFI) const {
86   if (Layout.empty())
87     return;
88 
89   for (int I = 0, E = MFI.getObjectIndexEnd(); I != E; ++I) {
90     if (MFI.isDeadObjectIndex(I))
91       continue;
92 
93     const AllocaInst *AI = MFI.getObjectAllocation(I);
94     if (!AI)
95       continue;
96 
97     SSPLayoutMap::const_iterator LI = Layout.find(AI);
98     if (LI == Layout.end())
99       continue;
100 
101     MFI.setObjectSSPLayout(I, LI->second);
102   }
103 }
104 
105 SSPLayoutInfo SSPLayoutAnalysis::run(Function &F,
106                                      FunctionAnalysisManager &FAM) {
107 
108   SSPLayoutInfo Info;
109   Info.RequireStackProtector =
110       SSPLayoutAnalysis::requiresStackProtector(&F, &Info.Layout);
111   Info.SSPBufferSize = F.getFnAttributeAsParsedInteger(
112       "stack-protector-buffer-size", SSPLayoutInfo::DefaultSSPBufferSize);
113   return Info;
114 }
115 
116 AnalysisKey SSPLayoutAnalysis::Key;
117 
118 PreservedAnalyses StackProtectorPass::run(Function &F,
119                                           FunctionAnalysisManager &FAM) {
120   auto &Info = FAM.getResult<SSPLayoutAnalysis>(F);
121   auto *DT = FAM.getCachedResult<DominatorTreeAnalysis>(F);
122   DomTreeUpdater DTU(DT, DomTreeUpdater::UpdateStrategy::Lazy);
123 
124   if (!Info.RequireStackProtector)
125     return PreservedAnalyses::all();
126 
127   // TODO(etienneb): Functions with funclets are not correctly supported now.
128   // Do nothing if this is funclet-based personality.
129   if (F.hasPersonalityFn()) {
130     EHPersonality Personality = classifyEHPersonality(F.getPersonalityFn());
131     if (isFuncletEHPersonality(Personality))
132       return PreservedAnalyses::all();
133   }
134 
135   ++NumFunProtected;
136   bool Changed = InsertStackProtectors(TM, &F, DT ? &DTU : nullptr,
137                                        Info.HasPrologue, Info.HasIRCheck);
138 #ifdef EXPENSIVE_CHECKS
139   assert((!DT || DT->verify(DominatorTree::VerificationLevel::Full)) &&
140          "Failed to maintain validity of domtree!");
141 #endif
142 
143   if (!Changed)
144     return PreservedAnalyses::all();
145   PreservedAnalyses PA;
146   PA.preserve<SSPLayoutAnalysis>();
147   PA.preserve<DominatorTreeAnalysis>();
148   return PA;
149 }
150 
151 char StackProtector::ID = 0;
152 
153 StackProtector::StackProtector() : FunctionPass(ID) {
154   initializeStackProtectorPass(*PassRegistry::getPassRegistry());
155 }
156 
157 INITIALIZE_PASS_BEGIN(StackProtector, DEBUG_TYPE,
158                       "Insert stack protectors", false, true)
159 INITIALIZE_PASS_DEPENDENCY(TargetPassConfig)
160 INITIALIZE_PASS_DEPENDENCY(DominatorTreeWrapperPass)
161 INITIALIZE_PASS_END(StackProtector, DEBUG_TYPE,
162                     "Insert stack protectors", false, true)
163 
164 FunctionPass *llvm::createStackProtectorPass() { return new StackProtector(); }
165 
166 void StackProtector::getAnalysisUsage(AnalysisUsage &AU) const {
167   AU.addRequired<TargetPassConfig>();
168   AU.addPreserved<DominatorTreeWrapperPass>();
169 }
170 
171 bool StackProtector::runOnFunction(Function &Fn) {
172   F = &Fn;
173   M = F->getParent();
174   if (auto *DTWP = getAnalysisIfAvailable<DominatorTreeWrapperPass>())
175     DTU.emplace(DTWP->getDomTree(), DomTreeUpdater::UpdateStrategy::Lazy);
176   TM = &getAnalysis<TargetPassConfig>().getTM<TargetMachine>();
177   LayoutInfo.HasPrologue = false;
178   LayoutInfo.HasIRCheck = false;
179 
180   LayoutInfo.SSPBufferSize = Fn.getFnAttributeAsParsedInteger(
181       "stack-protector-buffer-size", SSPLayoutInfo::DefaultSSPBufferSize);
182   if (!requiresStackProtector(F, &LayoutInfo.Layout))
183     return false;
184 
185   // TODO(etienneb): Functions with funclets are not correctly supported now.
186   // Do nothing if this is funclet-based personality.
187   if (Fn.hasPersonalityFn()) {
188     EHPersonality Personality = classifyEHPersonality(Fn.getPersonalityFn());
189     if (isFuncletEHPersonality(Personality))
190       return false;
191   }
192 
193   ++NumFunProtected;
194   bool Changed =
195       InsertStackProtectors(TM, F, DTU ? &*DTU : nullptr,
196                             LayoutInfo.HasPrologue, LayoutInfo.HasIRCheck);
197 #ifdef EXPENSIVE_CHECKS
198   assert((!DTU ||
199           DTU->getDomTree().verify(DominatorTree::VerificationLevel::Full)) &&
200          "Failed to maintain validity of domtree!");
201 #endif
202   DTU.reset();
203   return Changed;
204 }
205 
206 /// \param [out] IsLarge is set to true if a protectable array is found and
207 /// it is "large" ( >= ssp-buffer-size).  In the case of a structure with
208 /// multiple arrays, this gets set if any of them is large.
209 static bool ContainsProtectableArray(Type *Ty, Module *M, unsigned SSPBufferSize,
210                                      bool &IsLarge, bool Strong,
211                                      bool InStruct) {
212   if (!Ty)
213     return false;
214   if (ArrayType *AT = dyn_cast<ArrayType>(Ty)) {
215     if (!AT->getElementType()->isIntegerTy(8)) {
216       // If we're on a non-Darwin platform or we're inside of a structure, don't
217       // add stack protectors unless the array is a character array.
218       // However, in strong mode any array, regardless of type and size,
219       // triggers a protector.
220       if (!Strong && (InStruct || !Triple(M->getTargetTriple()).isOSDarwin()))
221         return false;
222     }
223 
224     // If an array has more than SSPBufferSize bytes of allocated space, then we
225     // emit stack protectors.
226     if (SSPBufferSize <= M->getDataLayout().getTypeAllocSize(AT)) {
227       IsLarge = true;
228       return true;
229     }
230 
231     if (Strong)
232       // Require a protector for all arrays in strong mode
233       return true;
234   }
235 
236   const StructType *ST = dyn_cast<StructType>(Ty);
237   if (!ST)
238     return false;
239 
240   bool NeedsProtector = false;
241   for (Type *ET : ST->elements())
242     if (ContainsProtectableArray(ET, M, SSPBufferSize, IsLarge, Strong, true)) {
243       // If the element is a protectable array and is large (>= SSPBufferSize)
244       // then we are done.  If the protectable array is not large, then
245       // keep looking in case a subsequent element is a large array.
246       if (IsLarge)
247         return true;
248       NeedsProtector = true;
249     }
250 
251   return NeedsProtector;
252 }
253 
254 /// Check whether a stack allocation has its address taken.
255 static bool HasAddressTaken(const Instruction *AI, TypeSize AllocSize,
256                             Module *M,
257                             SmallPtrSet<const PHINode *, 16> &VisitedPHIs) {
258   const DataLayout &DL = M->getDataLayout();
259   for (const User *U : AI->users()) {
260     const auto *I = cast<Instruction>(U);
261     // If this instruction accesses memory make sure it doesn't access beyond
262     // the bounds of the allocated object.
263     std::optional<MemoryLocation> MemLoc = MemoryLocation::getOrNone(I);
264     if (MemLoc && MemLoc->Size.hasValue() &&
265         !TypeSize::isKnownGE(AllocSize, MemLoc->Size.getValue()))
266       return true;
267     switch (I->getOpcode()) {
268     case Instruction::Store:
269       if (AI == cast<StoreInst>(I)->getValueOperand())
270         return true;
271       break;
272     case Instruction::AtomicCmpXchg:
273       // cmpxchg conceptually includes both a load and store from the same
274       // location. So, like store, the value being stored is what matters.
275       if (AI == cast<AtomicCmpXchgInst>(I)->getNewValOperand())
276         return true;
277       break;
278     case Instruction::PtrToInt:
279       if (AI == cast<PtrToIntInst>(I)->getOperand(0))
280         return true;
281       break;
282     case Instruction::Call: {
283       // Ignore intrinsics that do not become real instructions.
284       // TODO: Narrow this to intrinsics that have store-like effects.
285       const auto *CI = cast<CallInst>(I);
286       if (!CI->isDebugOrPseudoInst() && !CI->isLifetimeStartOrEnd())
287         return true;
288       break;
289     }
290     case Instruction::Invoke:
291       return true;
292     case Instruction::GetElementPtr: {
293       // If the GEP offset is out-of-bounds, or is non-constant and so has to be
294       // assumed to be potentially out-of-bounds, then any memory access that
295       // would use it could also be out-of-bounds meaning stack protection is
296       // required.
297       const GetElementPtrInst *GEP = cast<GetElementPtrInst>(I);
298       unsigned IndexSize = DL.getIndexTypeSizeInBits(I->getType());
299       APInt Offset(IndexSize, 0);
300       if (!GEP->accumulateConstantOffset(DL, Offset))
301         return true;
302       TypeSize OffsetSize = TypeSize::getFixed(Offset.getLimitedValue());
303       if (!TypeSize::isKnownGT(AllocSize, OffsetSize))
304         return true;
305       // Adjust AllocSize to be the space remaining after this offset.
306       // We can't subtract a fixed size from a scalable one, so in that case
307       // assume the scalable value is of minimum size.
308       TypeSize NewAllocSize =
309           TypeSize::getFixed(AllocSize.getKnownMinValue()) - OffsetSize;
310       if (HasAddressTaken(I, NewAllocSize, M, VisitedPHIs))
311         return true;
312       break;
313     }
314     case Instruction::BitCast:
315     case Instruction::Select:
316     case Instruction::AddrSpaceCast:
317       if (HasAddressTaken(I, AllocSize, M, VisitedPHIs))
318         return true;
319       break;
320     case Instruction::PHI: {
321       // Keep track of what PHI nodes we have already visited to ensure
322       // they are only visited once.
323       const auto *PN = cast<PHINode>(I);
324       if (VisitedPHIs.insert(PN).second)
325         if (HasAddressTaken(PN, AllocSize, M, VisitedPHIs))
326           return true;
327       break;
328     }
329     case Instruction::Load:
330     case Instruction::AtomicRMW:
331     case Instruction::Ret:
332       // These instructions take an address operand, but have load-like or
333       // other innocuous behavior that should not trigger a stack protector.
334       // atomicrmw conceptually has both load and store semantics, but the
335       // value being stored must be integer; so if a pointer is being stored,
336       // we'll catch it in the PtrToInt case above.
337       break;
338     default:
339       // Conservatively return true for any instruction that takes an address
340       // operand, but is not handled above.
341       return true;
342     }
343   }
344   return false;
345 }
346 
347 /// Search for the first call to the llvm.stackprotector intrinsic and return it
348 /// if present.
349 static const CallInst *findStackProtectorIntrinsic(Function &F) {
350   for (const BasicBlock &BB : F)
351     for (const Instruction &I : BB)
352       if (const auto *II = dyn_cast<IntrinsicInst>(&I))
353         if (II->getIntrinsicID() == Intrinsic::stackprotector)
354           return II;
355   return nullptr;
356 }
357 
358 /// Check whether or not this function needs a stack protector based
359 /// upon the stack protector level.
360 ///
361 /// We use two heuristics: a standard (ssp) and strong (sspstrong).
362 /// The standard heuristic which will add a guard variable to functions that
363 /// call alloca with a either a variable size or a size >= SSPBufferSize,
364 /// functions with character buffers larger than SSPBufferSize, and functions
365 /// with aggregates containing character buffers larger than SSPBufferSize. The
366 /// strong heuristic will add a guard variables to functions that call alloca
367 /// regardless of size, functions with any buffer regardless of type and size,
368 /// functions with aggregates that contain any buffer regardless of type and
369 /// size, and functions that contain stack-based variables that have had their
370 /// address taken.
371 bool SSPLayoutAnalysis::requiresStackProtector(Function *F,
372                                                SSPLayoutMap *Layout) {
373   Module *M = F->getParent();
374   bool Strong = false;
375   bool NeedsProtector = false;
376 
377   // The set of PHI nodes visited when determining if a variable's reference has
378   // been taken.  This set is maintained to ensure we don't visit the same PHI
379   // node multiple times.
380   SmallPtrSet<const PHINode *, 16> VisitedPHIs;
381 
382   unsigned SSPBufferSize = F->getFnAttributeAsParsedInteger(
383       "stack-protector-buffer-size", SSPLayoutInfo::DefaultSSPBufferSize);
384 
385   if (F->hasFnAttribute(Attribute::SafeStack))
386     return false;
387 
388   // We are constructing the OptimizationRemarkEmitter on the fly rather than
389   // using the analysis pass to avoid building DominatorTree and LoopInfo which
390   // are not available this late in the IR pipeline.
391   OptimizationRemarkEmitter ORE(F);
392 
393   if (F->hasFnAttribute(Attribute::StackProtectReq)) {
394     if (!Layout)
395       return true;
396     ORE.emit([&]() {
397       return OptimizationRemark(DEBUG_TYPE, "StackProtectorRequested", F)
398              << "Stack protection applied to function "
399              << ore::NV("Function", F)
400              << " due to a function attribute or command-line switch";
401     });
402     NeedsProtector = true;
403     Strong = true; // Use the same heuristic as strong to determine SSPLayout
404   } else if (F->hasFnAttribute(Attribute::StackProtectStrong))
405     Strong = true;
406   else if (!F->hasFnAttribute(Attribute::StackProtect))
407     return false;
408 
409   for (const BasicBlock &BB : *F) {
410     for (const Instruction &I : BB) {
411       if (const AllocaInst *AI = dyn_cast<AllocaInst>(&I)) {
412         if (AI->isArrayAllocation()) {
413           auto RemarkBuilder = [&]() {
414             return OptimizationRemark(DEBUG_TYPE, "StackProtectorAllocaOrArray",
415                                       &I)
416                    << "Stack protection applied to function "
417                    << ore::NV("Function", F)
418                    << " due to a call to alloca or use of a variable length "
419                       "array";
420           };
421           if (const auto *CI = dyn_cast<ConstantInt>(AI->getArraySize())) {
422             if (CI->getLimitedValue(SSPBufferSize) >= SSPBufferSize) {
423               // A call to alloca with size >= SSPBufferSize requires
424               // stack protectors.
425               if (!Layout)
426                 return true;
427               Layout->insert(
428                   std::make_pair(AI, MachineFrameInfo::SSPLK_LargeArray));
429               ORE.emit(RemarkBuilder);
430               NeedsProtector = true;
431             } else if (Strong) {
432               // Require protectors for all alloca calls in strong mode.
433               if (!Layout)
434                 return true;
435               Layout->insert(
436                   std::make_pair(AI, MachineFrameInfo::SSPLK_SmallArray));
437               ORE.emit(RemarkBuilder);
438               NeedsProtector = true;
439             }
440           } else {
441             // A call to alloca with a variable size requires protectors.
442             if (!Layout)
443               return true;
444             Layout->insert(
445                 std::make_pair(AI, MachineFrameInfo::SSPLK_LargeArray));
446             ORE.emit(RemarkBuilder);
447             NeedsProtector = true;
448           }
449           continue;
450         }
451 
452         bool IsLarge = false;
453         if (ContainsProtectableArray(AI->getAllocatedType(), M, SSPBufferSize,
454                                      IsLarge, Strong, false)) {
455           if (!Layout)
456             return true;
457           Layout->insert(std::make_pair(
458               AI, IsLarge ? MachineFrameInfo::SSPLK_LargeArray
459                           : MachineFrameInfo::SSPLK_SmallArray));
460           ORE.emit([&]() {
461             return OptimizationRemark(DEBUG_TYPE, "StackProtectorBuffer", &I)
462                    << "Stack protection applied to function "
463                    << ore::NV("Function", F)
464                    << " due to a stack allocated buffer or struct containing a "
465                       "buffer";
466           });
467           NeedsProtector = true;
468           continue;
469         }
470 
471         if (Strong &&
472             HasAddressTaken(
473                 AI, M->getDataLayout().getTypeAllocSize(AI->getAllocatedType()),
474                 M, VisitedPHIs)) {
475           ++NumAddrTaken;
476           if (!Layout)
477             return true;
478           Layout->insert(std::make_pair(AI, MachineFrameInfo::SSPLK_AddrOf));
479           ORE.emit([&]() {
480             return OptimizationRemark(DEBUG_TYPE, "StackProtectorAddressTaken",
481                                       &I)
482                    << "Stack protection applied to function "
483                    << ore::NV("Function", F)
484                    << " due to the address of a local variable being taken";
485           });
486           NeedsProtector = true;
487         }
488         // Clear any PHIs that we visited, to make sure we examine all uses of
489         // any subsequent allocas that we look at.
490         VisitedPHIs.clear();
491       }
492     }
493   }
494 
495   return NeedsProtector;
496 }
497 
498 /// Create a stack guard loading and populate whether SelectionDAG SSP is
499 /// supported.
500 static Value *getStackGuard(const TargetLoweringBase *TLI, Module *M,
501                             IRBuilder<> &B,
502                             bool *SupportsSelectionDAGSP = nullptr) {
503   Value *Guard = TLI->getIRStackGuard(B);
504   StringRef GuardMode = M->getStackProtectorGuard();
505   if ((GuardMode == "tls" || GuardMode.empty()) && Guard)
506     return B.CreateLoad(B.getPtrTy(), Guard, true, "StackGuard");
507 
508   // Use SelectionDAG SSP handling, since there isn't an IR guard.
509   //
510   // This is more or less weird, since we optionally output whether we
511   // should perform a SelectionDAG SP here. The reason is that it's strictly
512   // defined as !TLI->getIRStackGuard(B), where getIRStackGuard is also
513   // mutating. There is no way to get this bit without mutating the IR, so
514   // getting this bit has to happen in this right time.
515   //
516   // We could have define a new function TLI::supportsSelectionDAGSP(), but that
517   // will put more burden on the backends' overriding work, especially when it
518   // actually conveys the same information getIRStackGuard() already gives.
519   if (SupportsSelectionDAGSP)
520     *SupportsSelectionDAGSP = true;
521   TLI->insertSSPDeclarations(*M);
522   return B.CreateCall(Intrinsic::getDeclaration(M, Intrinsic::stackguard));
523 }
524 
525 /// Insert code into the entry block that stores the stack guard
526 /// variable onto the stack:
527 ///
528 ///   entry:
529 ///     StackGuardSlot = alloca i8*
530 ///     StackGuard = <stack guard>
531 ///     call void @llvm.stackprotector(StackGuard, StackGuardSlot)
532 ///
533 /// Returns true if the platform/triple supports the stackprotectorcreate pseudo
534 /// node.
535 static bool CreatePrologue(Function *F, Module *M, Instruction *CheckLoc,
536                            const TargetLoweringBase *TLI, AllocaInst *&AI) {
537   bool SupportsSelectionDAGSP = false;
538   IRBuilder<> B(&F->getEntryBlock().front());
539   PointerType *PtrTy = PointerType::getUnqual(CheckLoc->getContext());
540   AI = B.CreateAlloca(PtrTy, nullptr, "StackGuardSlot");
541 
542   Value *GuardSlot = getStackGuard(TLI, M, B, &SupportsSelectionDAGSP);
543   B.CreateCall(Intrinsic::getDeclaration(M, Intrinsic::stackprotector),
544                {GuardSlot, AI});
545   return SupportsSelectionDAGSP;
546 }
547 
548 bool InsertStackProtectors(const TargetMachine *TM, Function *F,
549                            DomTreeUpdater *DTU, bool &HasPrologue,
550                            bool &HasIRCheck) {
551   auto *M = F->getParent();
552   auto *TLI = TM->getSubtargetImpl(*F)->getTargetLowering();
553 
554   // If the target wants to XOR the frame pointer into the guard value, it's
555   // impossible to emit the check in IR, so the target *must* support stack
556   // protection in SDAG.
557   bool SupportsSelectionDAGSP =
558       TLI->useStackGuardXorFP() ||
559       (EnableSelectionDAGSP && !TM->Options.EnableFastISel);
560   AllocaInst *AI = nullptr; // Place on stack that stores the stack guard.
561   BasicBlock *FailBB = nullptr;
562 
563   for (BasicBlock &BB : llvm::make_early_inc_range(*F)) {
564     // This is stack protector auto generated check BB, skip it.
565     if (&BB == FailBB)
566       continue;
567     Instruction *CheckLoc = dyn_cast<ReturnInst>(BB.getTerminator());
568     if (!CheckLoc && !DisableCheckNoReturn)
569       for (auto &Inst : BB)
570         if (auto *CB = dyn_cast<CallBase>(&Inst))
571           // Do stack check before noreturn calls that aren't nounwind (e.g:
572           // __cxa_throw).
573           if (CB->doesNotReturn() && !CB->doesNotThrow()) {
574             CheckLoc = CB;
575             break;
576           }
577 
578     if (!CheckLoc)
579       continue;
580 
581     // Generate prologue instrumentation if not already generated.
582     if (!HasPrologue) {
583       HasPrologue = true;
584       SupportsSelectionDAGSP &= CreatePrologue(F, M, CheckLoc, TLI, AI);
585     }
586 
587     // SelectionDAG based code generation. Nothing else needs to be done here.
588     // The epilogue instrumentation is postponed to SelectionDAG.
589     if (SupportsSelectionDAGSP)
590       break;
591 
592     // Find the stack guard slot if the prologue was not created by this pass
593     // itself via a previous call to CreatePrologue().
594     if (!AI) {
595       const CallInst *SPCall = findStackProtectorIntrinsic(*F);
596       assert(SPCall && "Call to llvm.stackprotector is missing");
597       AI = cast<AllocaInst>(SPCall->getArgOperand(1));
598     }
599 
600     // Set HasIRCheck to true, so that SelectionDAG will not generate its own
601     // version. SelectionDAG called 'shouldEmitSDCheck' to check whether
602     // instrumentation has already been generated.
603     HasIRCheck = true;
604 
605     // If we're instrumenting a block with a tail call, the check has to be
606     // inserted before the call rather than between it and the return. The
607     // verifier guarantees that a tail call is either directly before the
608     // return or with a single correct bitcast of the return value in between so
609     // we don't need to worry about many situations here.
610     Instruction *Prev = CheckLoc->getPrevNonDebugInstruction();
611     if (Prev && isa<CallInst>(Prev) && cast<CallInst>(Prev)->isTailCall())
612       CheckLoc = Prev;
613     else if (Prev) {
614       Prev = Prev->getPrevNonDebugInstruction();
615       if (Prev && isa<CallInst>(Prev) && cast<CallInst>(Prev)->isTailCall())
616         CheckLoc = Prev;
617     }
618 
619     // Generate epilogue instrumentation. The epilogue intrumentation can be
620     // function-based or inlined depending on which mechanism the target is
621     // providing.
622     if (Function *GuardCheck = TLI->getSSPStackGuardCheck(*M)) {
623       // Generate the function-based epilogue instrumentation.
624       // The target provides a guard check function, generate a call to it.
625       IRBuilder<> B(CheckLoc);
626       LoadInst *Guard = B.CreateLoad(B.getPtrTy(), AI, true, "Guard");
627       CallInst *Call = B.CreateCall(GuardCheck, {Guard});
628       Call->setAttributes(GuardCheck->getAttributes());
629       Call->setCallingConv(GuardCheck->getCallingConv());
630     } else {
631       // Generate the epilogue with inline instrumentation.
632       // If we do not support SelectionDAG based calls, generate IR level
633       // calls.
634       //
635       // For each block with a return instruction, convert this:
636       //
637       //   return:
638       //     ...
639       //     ret ...
640       //
641       // into this:
642       //
643       //   return:
644       //     ...
645       //     %1 = <stack guard>
646       //     %2 = load StackGuardSlot
647       //     %3 = icmp ne i1 %1, %2
648       //     br i1 %3, label %CallStackCheckFailBlk, label %SP_return
649       //
650       //   SP_return:
651       //     ret ...
652       //
653       //   CallStackCheckFailBlk:
654       //     call void @__stack_chk_fail()
655       //     unreachable
656 
657       // Create the FailBB. We duplicate the BB every time since the MI tail
658       // merge pass will merge together all of the various BB into one including
659       // fail BB generated by the stack protector pseudo instruction.
660       if (!FailBB)
661         FailBB = CreateFailBB(F, TM->getTargetTriple());
662 
663       IRBuilder<> B(CheckLoc);
664       Value *Guard = getStackGuard(TLI, M, B);
665       LoadInst *LI2 = B.CreateLoad(B.getPtrTy(), AI, true);
666       auto *Cmp = cast<ICmpInst>(B.CreateICmpNE(Guard, LI2));
667       auto SuccessProb =
668           BranchProbabilityInfo::getBranchProbStackProtector(true);
669       auto FailureProb =
670           BranchProbabilityInfo::getBranchProbStackProtector(false);
671       MDNode *Weights = MDBuilder(F->getContext())
672                             .createBranchWeights(FailureProb.getNumerator(),
673                                                  SuccessProb.getNumerator());
674 
675       SplitBlockAndInsertIfThen(Cmp, CheckLoc,
676                                 /*Unreachable=*/false, Weights, DTU,
677                                 /*LI=*/nullptr, /*ThenBlock=*/FailBB);
678 
679       auto *BI = cast<BranchInst>(Cmp->getParent()->getTerminator());
680       BasicBlock *NewBB = BI->getSuccessor(1);
681       NewBB->setName("SP_return");
682       NewBB->moveAfter(&BB);
683 
684       Cmp->setPredicate(Cmp->getInversePredicate());
685       BI->swapSuccessors();
686     }
687   }
688 
689   // Return if we didn't modify any basic blocks. i.e., there are no return
690   // statements in the function.
691   return HasPrologue;
692 }
693 
694 BasicBlock *CreateFailBB(Function *F, const Triple &Trip) {
695   auto *M = F->getParent();
696   LLVMContext &Context = F->getContext();
697   BasicBlock *FailBB = BasicBlock::Create(Context, "CallStackCheckFailBlk", F);
698   IRBuilder<> B(FailBB);
699   if (F->getSubprogram())
700     B.SetCurrentDebugLocation(
701         DILocation::get(Context, 0, 0, F->getSubprogram()));
702   FunctionCallee StackChkFail;
703   SmallVector<Value *, 1> Args;
704   if (Trip.isOSOpenBSD()) {
705     StackChkFail = M->getOrInsertFunction("__stack_smash_handler",
706                                           Type::getVoidTy(Context),
707                                           PointerType::getUnqual(Context));
708     Args.push_back(B.CreateGlobalStringPtr(F->getName(), "SSH"));
709   } else {
710     StackChkFail =
711         M->getOrInsertFunction("__stack_chk_fail", Type::getVoidTy(Context));
712   }
713   cast<Function>(StackChkFail.getCallee())->addFnAttr(Attribute::NoReturn);
714   B.CreateCall(StackChkFail, Args);
715   B.CreateUnreachable();
716   return FailBB;
717 }
718