1 //==- UnreachableCodeChecker.cpp - Generalized dead code checker -*- C++ -*-==// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 // This file implements a generalized unreachable code checker using a 9 // path-sensitive analysis. We mark any path visited, and then walk the CFG as a 10 // post-analysis to determine what was never visited. 11 // 12 // A similar flow-sensitive only check exists in Analysis/ReachableCode.cpp 13 //===----------------------------------------------------------------------===// 14 15 #include "clang/StaticAnalyzer/Checkers/BuiltinCheckerRegistration.h" 16 #include "clang/AST/ParentMap.h" 17 #include "clang/Basic/Builtins.h" 18 #include "clang/Basic/SourceManager.h" 19 #include "clang/StaticAnalyzer/Core/BugReporter/BugReporter.h" 20 #include "clang/StaticAnalyzer/Core/Checker.h" 21 #include "clang/StaticAnalyzer/Core/CheckerManager.h" 22 #include "clang/StaticAnalyzer/Core/PathSensitive/CheckerContext.h" 23 #include "clang/StaticAnalyzer/Core/PathSensitive/CheckerHelpers.h" 24 #include "clang/StaticAnalyzer/Core/PathSensitive/ExplodedGraph.h" 25 #include "clang/StaticAnalyzer/Core/PathSensitive/SVals.h" 26 #include "llvm/ADT/SmallSet.h" 27 #include <optional> 28 29 using namespace clang; 30 using namespace ento; 31 32 namespace { 33 class UnreachableCodeChecker : public Checker<check::EndAnalysis> { 34 public: 35 void checkEndAnalysis(ExplodedGraph &G, BugReporter &B, 36 ExprEngine &Eng) const; 37 private: 38 typedef llvm::SmallSet<unsigned, 32> CFGBlocksSet; 39 40 static inline const Stmt *getUnreachableStmt(const CFGBlock *CB); 41 static void FindUnreachableEntryPoints(const CFGBlock *CB, 42 CFGBlocksSet &reachable, 43 CFGBlocksSet &visited); 44 static bool isInvalidPath(const CFGBlock *CB, const ParentMap &PM); 45 static inline bool isEmptyCFGBlock(const CFGBlock *CB); 46 }; 47 } 48 49 void UnreachableCodeChecker::checkEndAnalysis(ExplodedGraph &G, 50 BugReporter &B, 51 ExprEngine &Eng) const { 52 CFGBlocksSet reachable, visited; 53 54 if (Eng.hasWorkRemaining()) 55 return; 56 57 const Decl *D = nullptr; 58 CFG *C = nullptr; 59 const ParentMap *PM = nullptr; 60 const LocationContext *LC = nullptr; 61 // Iterate over ExplodedGraph 62 for (const ExplodedNode &N : G.nodes()) { 63 const ProgramPoint &P = N.getLocation(); 64 LC = P.getLocationContext(); 65 if (!LC->inTopFrame()) 66 continue; 67 68 if (!D) 69 D = LC->getAnalysisDeclContext()->getDecl(); 70 71 // Save the CFG if we don't have it already 72 if (!C) 73 C = LC->getAnalysisDeclContext()->getUnoptimizedCFG(); 74 if (!PM) 75 PM = &LC->getParentMap(); 76 77 if (std::optional<BlockEntrance> BE = P.getAs<BlockEntrance>()) { 78 const CFGBlock *CB = BE->getBlock(); 79 reachable.insert(CB->getBlockID()); 80 } 81 } 82 83 // Bail out if we didn't get the CFG or the ParentMap. 84 if (!D || !C || !PM) 85 return; 86 87 // Don't do anything for template instantiations. Proving that code 88 // in a template instantiation is unreachable means proving that it is 89 // unreachable in all instantiations. 90 if (const FunctionDecl *FD = dyn_cast<FunctionDecl>(D)) 91 if (FD->isTemplateInstantiation()) 92 return; 93 94 // Find CFGBlocks that were not covered by any node 95 for (const CFGBlock *CB : *C) { 96 // Check if the block is unreachable 97 if (reachable.count(CB->getBlockID())) 98 continue; 99 100 // Check if the block is empty (an artificial block) 101 if (isEmptyCFGBlock(CB)) 102 continue; 103 104 // Find the entry points for this block 105 if (!visited.count(CB->getBlockID())) 106 FindUnreachableEntryPoints(CB, reachable, visited); 107 108 // This block may have been pruned; check if we still want to report it 109 if (reachable.count(CB->getBlockID())) 110 continue; 111 112 // Check for false positives 113 if (isInvalidPath(CB, *PM)) 114 continue; 115 116 // It is good practice to always have a "default" label in a "switch", even 117 // if we should never get there. It can be used to detect errors, for 118 // instance. Unreachable code directly under a "default" label is therefore 119 // likely to be a false positive. 120 if (const Stmt *label = CB->getLabel()) 121 if (label->getStmtClass() == Stmt::DefaultStmtClass) 122 continue; 123 124 // Special case for __builtin_unreachable. 125 // FIXME: This should be extended to include other unreachable markers, 126 // such as llvm_unreachable. 127 if (!CB->empty()) { 128 bool foundUnreachable = false; 129 for (CFGBlock::const_iterator ci = CB->begin(), ce = CB->end(); 130 ci != ce; ++ci) { 131 if (std::optional<CFGStmt> S = (*ci).getAs<CFGStmt>()) 132 if (const CallExpr *CE = dyn_cast<CallExpr>(S->getStmt())) { 133 if (CE->getBuiltinCallee() == Builtin::BI__builtin_unreachable || 134 CE->isBuiltinAssumeFalse(Eng.getContext())) { 135 foundUnreachable = true; 136 break; 137 } 138 } 139 } 140 if (foundUnreachable) 141 continue; 142 } 143 144 // We found a block that wasn't covered - find the statement to report 145 SourceRange SR; 146 PathDiagnosticLocation DL; 147 SourceLocation SL; 148 if (const Stmt *S = getUnreachableStmt(CB)) { 149 // In macros, 'do {...} while (0)' is often used. Don't warn about the 150 // condition 0 when it is unreachable. 151 if (S->getBeginLoc().isMacroID()) 152 if (const auto *I = dyn_cast<IntegerLiteral>(S)) 153 if (I->getValue() == 0ULL) 154 if (const Stmt *Parent = PM->getParent(S)) 155 if (isa<DoStmt>(Parent)) 156 continue; 157 SR = S->getSourceRange(); 158 DL = PathDiagnosticLocation::createBegin(S, B.getSourceManager(), LC); 159 SL = DL.asLocation(); 160 if (SR.isInvalid() || !SL.isValid()) 161 continue; 162 } 163 else 164 continue; 165 166 // Check if the SourceLocation is in a system header 167 const SourceManager &SM = B.getSourceManager(); 168 if (SM.isInSystemHeader(SL) || SM.isInExternCSystemHeader(SL)) 169 continue; 170 171 B.EmitBasicReport(D, this, "Unreachable code", categories::UnusedCode, 172 "This statement is never executed", DL, SR); 173 } 174 } 175 176 // Recursively finds the entry point(s) for this dead CFGBlock. 177 void UnreachableCodeChecker::FindUnreachableEntryPoints(const CFGBlock *CB, 178 CFGBlocksSet &reachable, 179 CFGBlocksSet &visited) { 180 visited.insert(CB->getBlockID()); 181 182 for (const CFGBlock *PredBlock : CB->preds()) { 183 if (!PredBlock) 184 continue; 185 186 if (!reachable.count(PredBlock->getBlockID())) { 187 // If we find an unreachable predecessor, mark this block as reachable so 188 // we don't report this block 189 reachable.insert(CB->getBlockID()); 190 if (!visited.count(PredBlock->getBlockID())) 191 // If we haven't previously visited the unreachable predecessor, recurse 192 FindUnreachableEntryPoints(PredBlock, reachable, visited); 193 } 194 } 195 } 196 197 // Find the Stmt* in a CFGBlock for reporting a warning 198 const Stmt *UnreachableCodeChecker::getUnreachableStmt(const CFGBlock *CB) { 199 for (const CFGElement &Elem : *CB) { 200 if (std::optional<CFGStmt> S = Elem.getAs<CFGStmt>()) { 201 if (!isa<DeclStmt>(S->getStmt())) 202 return S->getStmt(); 203 } 204 } 205 return CB->getTerminatorStmt(); 206 } 207 208 // Determines if the path to this CFGBlock contained an element that infers this 209 // block is a false positive. We assume that FindUnreachableEntryPoints has 210 // already marked only the entry points to any dead code, so we need only to 211 // find the condition that led to this block (the predecessor of this block.) 212 // There will never be more than one predecessor. 213 bool UnreachableCodeChecker::isInvalidPath(const CFGBlock *CB, 214 const ParentMap &PM) { 215 // We only expect a predecessor size of 0 or 1. If it is >1, then an external 216 // condition has broken our assumption (for example, a sink being placed by 217 // another check). In these cases, we choose not to report. 218 if (CB->pred_size() > 1) 219 return true; 220 221 // If there are no predecessors, then this block is trivially unreachable 222 if (CB->pred_size() == 0) 223 return false; 224 225 const CFGBlock *pred = *CB->pred_begin(); 226 if (!pred) 227 return false; 228 229 // Get the predecessor block's terminator condition 230 const Stmt *cond = pred->getTerminatorCondition(); 231 232 //assert(cond && "CFGBlock's predecessor has a terminator condition"); 233 // The previous assertion is invalid in some cases (eg do/while). Leaving 234 // reporting of these situations on at the moment to help triage these cases. 235 if (!cond) 236 return false; 237 238 // Run each of the checks on the conditions 239 return containsMacro(cond) || containsEnum(cond) || 240 containsStaticLocal(cond) || containsBuiltinOffsetOf(cond) || 241 containsStmt<UnaryExprOrTypeTraitExpr>(cond); 242 } 243 244 // Returns true if the given CFGBlock is empty 245 bool UnreachableCodeChecker::isEmptyCFGBlock(const CFGBlock *CB) { 246 return CB->getLabel() == nullptr // No labels 247 && CB->size() == 0 // No statements 248 && !CB->getTerminatorStmt(); // No terminator 249 } 250 251 void ento::registerUnreachableCodeChecker(CheckerManager &mgr) { 252 mgr.registerChecker<UnreachableCodeChecker>(); 253 } 254 255 bool ento::shouldRegisterUnreachableCodeChecker(const CheckerManager &mgr) { 256 return true; 257 } 258