1 //== ValistChecker.cpp - stdarg.h macro usage checker -----------*- C++ -*--==// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 // 9 // This defines checkers which detect usage of uninitialized va_list values 10 // and va_start calls with no matching va_end. 11 // 12 //===----------------------------------------------------------------------===// 13 14 #include "clang/StaticAnalyzer/Checkers/BuiltinCheckerRegistration.h" 15 #include "clang/StaticAnalyzer/Core/BugReporter/BugType.h" 16 #include "clang/StaticAnalyzer/Core/Checker.h" 17 #include "clang/StaticAnalyzer/Core/CheckerManager.h" 18 #include "clang/StaticAnalyzer/Core/PathSensitive/CallDescription.h" 19 #include "clang/StaticAnalyzer/Core/PathSensitive/CallEvent.h" 20 #include "clang/StaticAnalyzer/Core/PathSensitive/CheckerContext.h" 21 22 using namespace clang; 23 using namespace ento; 24 25 REGISTER_SET_WITH_PROGRAMSTATE(InitializedVALists, const MemRegion *) 26 27 namespace { 28 typedef SmallVector<const MemRegion *, 2> RegionVector; 29 30 class ValistChecker : public Checker<check::PreCall, check::PreStmt<VAArgExpr>, 31 check::DeadSymbols> { 32 mutable std::unique_ptr<BugType> BT_leakedvalist, BT_uninitaccess; 33 34 struct VAListAccepter { 35 CallDescription Func; 36 int VAListPos; 37 }; 38 static const SmallVector<VAListAccepter, 15> VAListAccepters; 39 static const CallDescription VaStart, VaEnd, VaCopy; 40 41 public: 42 enum CheckKind { 43 CK_Uninitialized, 44 CK_Unterminated, 45 CK_CopyToSelf, 46 CK_NumCheckKinds 47 }; 48 49 DefaultBool ChecksEnabled[CK_NumCheckKinds]; 50 CheckerNameRef CheckNames[CK_NumCheckKinds]; 51 52 void checkPreStmt(const VAArgExpr *VAA, CheckerContext &C) const; 53 void checkPreCall(const CallEvent &Call, CheckerContext &C) const; 54 void checkDeadSymbols(SymbolReaper &SR, CheckerContext &C) const; 55 56 private: 57 const MemRegion *getVAListAsRegion(SVal SV, const Expr *VAExpr, 58 bool &IsSymbolic, CheckerContext &C) const; 59 const ExplodedNode *getStartCallSite(const ExplodedNode *N, 60 const MemRegion *Reg) const; 61 62 void reportUninitializedAccess(const MemRegion *VAList, StringRef Msg, 63 CheckerContext &C) const; 64 void reportLeakedVALists(const RegionVector &LeakedVALists, StringRef Msg1, 65 StringRef Msg2, CheckerContext &C, ExplodedNode *N, 66 bool ReportUninit = false) const; 67 68 void checkVAListStartCall(const CallEvent &Call, CheckerContext &C, 69 bool IsCopy) const; 70 void checkVAListEndCall(const CallEvent &Call, CheckerContext &C) const; 71 72 class ValistBugVisitor : public BugReporterVisitor { 73 public: 74 ValistBugVisitor(const MemRegion *Reg, bool IsLeak = false) 75 : Reg(Reg), IsLeak(IsLeak) {} 76 void Profile(llvm::FoldingSetNodeID &ID) const override { 77 static int X = 0; 78 ID.AddPointer(&X); 79 ID.AddPointer(Reg); 80 } 81 PathDiagnosticPieceRef getEndPath(BugReporterContext &BRC, 82 const ExplodedNode *EndPathNode, 83 PathSensitiveBugReport &BR) override { 84 if (!IsLeak) 85 return nullptr; 86 87 PathDiagnosticLocation L = BR.getLocation(); 88 // Do not add the statement itself as a range in case of leak. 89 return std::make_shared<PathDiagnosticEventPiece>(L, BR.getDescription(), 90 false); 91 } 92 PathDiagnosticPieceRef VisitNode(const ExplodedNode *N, 93 BugReporterContext &BRC, 94 PathSensitiveBugReport &BR) override; 95 96 private: 97 const MemRegion *Reg; 98 bool IsLeak; 99 }; 100 }; 101 102 const SmallVector<ValistChecker::VAListAccepter, 15> 103 ValistChecker::VAListAccepters = { 104 {{"vfprintf", 3}, 2}, 105 {{"vfscanf", 3}, 2}, 106 {{"vprintf", 2}, 1}, 107 {{"vscanf", 2}, 1}, 108 {{"vsnprintf", 4}, 3}, 109 {{"vsprintf", 3}, 2}, 110 {{"vsscanf", 3}, 2}, 111 {{"vfwprintf", 3}, 2}, 112 {{"vfwscanf", 3}, 2}, 113 {{"vwprintf", 2}, 1}, 114 {{"vwscanf", 2}, 1}, 115 {{"vswprintf", 4}, 3}, 116 // vswprintf is the wide version of vsnprintf, 117 // vsprintf has no wide version 118 {{"vswscanf", 3}, 2}}; 119 120 const CallDescription 121 ValistChecker::VaStart("__builtin_va_start", /*Args=*/2, /*Params=*/1), 122 ValistChecker::VaCopy("__builtin_va_copy", 2), 123 ValistChecker::VaEnd("__builtin_va_end", 1); 124 } // end anonymous namespace 125 126 void ValistChecker::checkPreCall(const CallEvent &Call, 127 CheckerContext &C) const { 128 if (!Call.isGlobalCFunction()) 129 return; 130 if (VaStart.matches(Call)) 131 checkVAListStartCall(Call, C, false); 132 else if (VaCopy.matches(Call)) 133 checkVAListStartCall(Call, C, true); 134 else if (VaEnd.matches(Call)) 135 checkVAListEndCall(Call, C); 136 else { 137 for (auto FuncInfo : VAListAccepters) { 138 if (!FuncInfo.Func.matches(Call)) 139 continue; 140 bool Symbolic; 141 const MemRegion *VAList = 142 getVAListAsRegion(Call.getArgSVal(FuncInfo.VAListPos), 143 Call.getArgExpr(FuncInfo.VAListPos), Symbolic, C); 144 if (!VAList) 145 return; 146 147 if (C.getState()->contains<InitializedVALists>(VAList)) 148 return; 149 150 // We did not see va_start call, but the source of the region is unknown. 151 // Be conservative and assume the best. 152 if (Symbolic) 153 return; 154 155 SmallString<80> Errmsg("Function '"); 156 Errmsg += FuncInfo.Func.getFunctionName(); 157 Errmsg += "' is called with an uninitialized va_list argument"; 158 reportUninitializedAccess(VAList, Errmsg.c_str(), C); 159 break; 160 } 161 } 162 } 163 164 const MemRegion *ValistChecker::getVAListAsRegion(SVal SV, const Expr *E, 165 bool &IsSymbolic, 166 CheckerContext &C) const { 167 const MemRegion *Reg = SV.getAsRegion(); 168 if (!Reg) 169 return nullptr; 170 // TODO: In the future this should be abstracted away by the analyzer. 171 bool VaListModelledAsArray = false; 172 if (const auto *Cast = dyn_cast<CastExpr>(E)) { 173 QualType Ty = Cast->getType(); 174 VaListModelledAsArray = 175 Ty->isPointerType() && Ty->getPointeeType()->isRecordType(); 176 } 177 if (const auto *DeclReg = Reg->getAs<DeclRegion>()) { 178 if (isa<ParmVarDecl>(DeclReg->getDecl())) 179 Reg = C.getState()->getSVal(SV.castAs<Loc>()).getAsRegion(); 180 } 181 IsSymbolic = Reg && Reg->getAs<SymbolicRegion>(); 182 // Some VarRegion based VA lists reach here as ElementRegions. 183 const auto *EReg = dyn_cast_or_null<ElementRegion>(Reg); 184 return (EReg && VaListModelledAsArray) ? EReg->getSuperRegion() : Reg; 185 } 186 187 void ValistChecker::checkPreStmt(const VAArgExpr *VAA, 188 CheckerContext &C) const { 189 ProgramStateRef State = C.getState(); 190 const Expr *VASubExpr = VAA->getSubExpr(); 191 SVal VAListSVal = C.getSVal(VASubExpr); 192 bool Symbolic; 193 const MemRegion *VAList = 194 getVAListAsRegion(VAListSVal, VASubExpr, Symbolic, C); 195 if (!VAList) 196 return; 197 if (Symbolic) 198 return; 199 if (!State->contains<InitializedVALists>(VAList)) 200 reportUninitializedAccess( 201 VAList, "va_arg() is called on an uninitialized va_list", C); 202 } 203 204 void ValistChecker::checkDeadSymbols(SymbolReaper &SR, 205 CheckerContext &C) const { 206 ProgramStateRef State = C.getState(); 207 InitializedVAListsTy TrackedVALists = State->get<InitializedVALists>(); 208 RegionVector LeakedVALists; 209 for (auto Reg : TrackedVALists) { 210 if (SR.isLiveRegion(Reg)) 211 continue; 212 LeakedVALists.push_back(Reg); 213 State = State->remove<InitializedVALists>(Reg); 214 } 215 if (ExplodedNode *N = C.addTransition(State)) 216 reportLeakedVALists(LeakedVALists, "Initialized va_list", " is leaked", C, 217 N); 218 } 219 220 // This function traverses the exploded graph backwards and finds the node where 221 // the va_list is initialized. That node is used for uniquing the bug paths. 222 // It is not likely that there are several different va_lists that belongs to 223 // different stack frames, so that case is not yet handled. 224 const ExplodedNode * 225 ValistChecker::getStartCallSite(const ExplodedNode *N, 226 const MemRegion *Reg) const { 227 const LocationContext *LeakContext = N->getLocationContext(); 228 const ExplodedNode *StartCallNode = N; 229 230 bool FoundInitializedState = false; 231 232 while (N) { 233 ProgramStateRef State = N->getState(); 234 if (!State->contains<InitializedVALists>(Reg)) { 235 if (FoundInitializedState) 236 break; 237 } else { 238 FoundInitializedState = true; 239 } 240 const LocationContext *NContext = N->getLocationContext(); 241 if (NContext == LeakContext || NContext->isParentOf(LeakContext)) 242 StartCallNode = N; 243 N = N->pred_empty() ? nullptr : *(N->pred_begin()); 244 } 245 246 return StartCallNode; 247 } 248 249 void ValistChecker::reportUninitializedAccess(const MemRegion *VAList, 250 StringRef Msg, 251 CheckerContext &C) const { 252 if (!ChecksEnabled[CK_Uninitialized]) 253 return; 254 if (ExplodedNode *N = C.generateErrorNode()) { 255 if (!BT_uninitaccess) 256 BT_uninitaccess.reset(new BugType(CheckNames[CK_Uninitialized], 257 "Uninitialized va_list", 258 categories::MemoryError)); 259 auto R = std::make_unique<PathSensitiveBugReport>(*BT_uninitaccess, Msg, N); 260 R->markInteresting(VAList); 261 R->addVisitor(std::make_unique<ValistBugVisitor>(VAList)); 262 C.emitReport(std::move(R)); 263 } 264 } 265 266 void ValistChecker::reportLeakedVALists(const RegionVector &LeakedVALists, 267 StringRef Msg1, StringRef Msg2, 268 CheckerContext &C, ExplodedNode *N, 269 bool ReportUninit) const { 270 if (!(ChecksEnabled[CK_Unterminated] || 271 (ChecksEnabled[CK_Uninitialized] && ReportUninit))) 272 return; 273 for (auto Reg : LeakedVALists) { 274 if (!BT_leakedvalist) { 275 // FIXME: maybe creating a new check name for this type of bug is a better 276 // solution. 277 BT_leakedvalist.reset( 278 new BugType(CheckNames[CK_Unterminated].getName().empty() 279 ? CheckNames[CK_Uninitialized] 280 : CheckNames[CK_Unterminated], 281 "Leaked va_list", categories::MemoryError, 282 /*SuppressOnSink=*/true)); 283 } 284 285 const ExplodedNode *StartNode = getStartCallSite(N, Reg); 286 PathDiagnosticLocation LocUsedForUniqueing; 287 288 if (const Stmt *StartCallStmt = StartNode->getStmtForDiagnostics()) 289 LocUsedForUniqueing = PathDiagnosticLocation::createBegin( 290 StartCallStmt, C.getSourceManager(), StartNode->getLocationContext()); 291 292 SmallString<100> Buf; 293 llvm::raw_svector_ostream OS(Buf); 294 OS << Msg1; 295 std::string VariableName = Reg->getDescriptiveName(); 296 if (!VariableName.empty()) 297 OS << " " << VariableName; 298 OS << Msg2; 299 300 auto R = std::make_unique<PathSensitiveBugReport>( 301 *BT_leakedvalist, OS.str(), N, LocUsedForUniqueing, 302 StartNode->getLocationContext()->getDecl()); 303 R->markInteresting(Reg); 304 R->addVisitor(std::make_unique<ValistBugVisitor>(Reg, true)); 305 C.emitReport(std::move(R)); 306 } 307 } 308 309 void ValistChecker::checkVAListStartCall(const CallEvent &Call, 310 CheckerContext &C, bool IsCopy) const { 311 bool Symbolic; 312 const MemRegion *VAList = 313 getVAListAsRegion(Call.getArgSVal(0), Call.getArgExpr(0), Symbolic, C); 314 if (!VAList) 315 return; 316 317 ProgramStateRef State = C.getState(); 318 319 if (IsCopy) { 320 const MemRegion *Arg2 = 321 getVAListAsRegion(Call.getArgSVal(1), Call.getArgExpr(1), Symbolic, C); 322 if (Arg2) { 323 if (ChecksEnabled[CK_CopyToSelf] && VAList == Arg2) { 324 RegionVector LeakedVALists{VAList}; 325 if (ExplodedNode *N = C.addTransition(State)) 326 reportLeakedVALists(LeakedVALists, "va_list", 327 " is copied onto itself", C, N, true); 328 return; 329 } else if (!State->contains<InitializedVALists>(Arg2) && !Symbolic) { 330 if (State->contains<InitializedVALists>(VAList)) { 331 State = State->remove<InitializedVALists>(VAList); 332 RegionVector LeakedVALists{VAList}; 333 if (ExplodedNode *N = C.addTransition(State)) 334 reportLeakedVALists(LeakedVALists, "Initialized va_list", 335 " is overwritten by an uninitialized one", C, N, 336 true); 337 } else { 338 reportUninitializedAccess(Arg2, "Uninitialized va_list is copied", C); 339 } 340 return; 341 } 342 } 343 } 344 if (State->contains<InitializedVALists>(VAList)) { 345 RegionVector LeakedVALists{VAList}; 346 if (ExplodedNode *N = C.addTransition(State)) 347 reportLeakedVALists(LeakedVALists, "Initialized va_list", 348 " is initialized again", C, N); 349 return; 350 } 351 352 State = State->add<InitializedVALists>(VAList); 353 C.addTransition(State); 354 } 355 356 void ValistChecker::checkVAListEndCall(const CallEvent &Call, 357 CheckerContext &C) const { 358 bool Symbolic; 359 const MemRegion *VAList = 360 getVAListAsRegion(Call.getArgSVal(0), Call.getArgExpr(0), Symbolic, C); 361 if (!VAList) 362 return; 363 364 // We did not see va_start call, but the source of the region is unknown. 365 // Be conservative and assume the best. 366 if (Symbolic) 367 return; 368 369 if (!C.getState()->contains<InitializedVALists>(VAList)) { 370 reportUninitializedAccess( 371 VAList, "va_end() is called on an uninitialized va_list", C); 372 return; 373 } 374 ProgramStateRef State = C.getState(); 375 State = State->remove<InitializedVALists>(VAList); 376 C.addTransition(State); 377 } 378 379 PathDiagnosticPieceRef ValistChecker::ValistBugVisitor::VisitNode( 380 const ExplodedNode *N, BugReporterContext &BRC, PathSensitiveBugReport &) { 381 ProgramStateRef State = N->getState(); 382 ProgramStateRef StatePrev = N->getFirstPred()->getState(); 383 384 const Stmt *S = N->getStmtForDiagnostics(); 385 if (!S) 386 return nullptr; 387 388 StringRef Msg; 389 if (State->contains<InitializedVALists>(Reg) && 390 !StatePrev->contains<InitializedVALists>(Reg)) 391 Msg = "Initialized va_list"; 392 else if (!State->contains<InitializedVALists>(Reg) && 393 StatePrev->contains<InitializedVALists>(Reg)) 394 Msg = "Ended va_list"; 395 396 if (Msg.empty()) 397 return nullptr; 398 399 PathDiagnosticLocation Pos(S, BRC.getSourceManager(), 400 N->getLocationContext()); 401 return std::make_shared<PathDiagnosticEventPiece>(Pos, Msg, true); 402 } 403 404 void ento::registerValistBase(CheckerManager &mgr) { 405 mgr.registerChecker<ValistChecker>(); 406 } 407 408 bool ento::shouldRegisterValistBase(const CheckerManager &mgr) { 409 return true; 410 } 411 412 #define REGISTER_CHECKER(name) \ 413 void ento::register##name##Checker(CheckerManager &mgr) { \ 414 ValistChecker *checker = mgr.getChecker<ValistChecker>(); \ 415 checker->ChecksEnabled[ValistChecker::CK_##name] = true; \ 416 checker->CheckNames[ValistChecker::CK_##name] = \ 417 mgr.getCurrentCheckerName(); \ 418 } \ 419 \ 420 bool ento::shouldRegister##name##Checker(const CheckerManager &mgr) { \ 421 return true; \ 422 } 423 424 REGISTER_CHECKER(Uninitialized) 425 REGISTER_CHECKER(Unterminated) 426 REGISTER_CHECKER(CopyToSelf) 427