1 //===----- CGCoroutine.cpp - Emit LLVM Code for C++ coroutines ------------===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 // 9 // This contains code dealing with C++ code generation of coroutines. 10 // 11 //===----------------------------------------------------------------------===// 12 13 #include "CGCleanup.h" 14 #include "CodeGenFunction.h" 15 #include "llvm/ADT/ScopeExit.h" 16 #include "clang/AST/StmtCXX.h" 17 #include "clang/AST/StmtVisitor.h" 18 19 using namespace clang; 20 using namespace CodeGen; 21 22 using llvm::Value; 23 using llvm::BasicBlock; 24 25 namespace { 26 enum class AwaitKind { Init, Normal, Yield, Final }; 27 static constexpr llvm::StringLiteral AwaitKindStr[] = {"init", "await", "yield", 28 "final"}; 29 } 30 31 struct clang::CodeGen::CGCoroData { 32 // What is the current await expression kind and how many 33 // await/yield expressions were encountered so far. 34 // These are used to generate pretty labels for await expressions in LLVM IR. 35 AwaitKind CurrentAwaitKind = AwaitKind::Init; 36 unsigned AwaitNum = 0; 37 unsigned YieldNum = 0; 38 39 // How many co_return statements are in the coroutine. Used to decide whether 40 // we need to add co_return; equivalent at the end of the user authored body. 41 unsigned CoreturnCount = 0; 42 43 // A branch to this block is emitted when coroutine needs to suspend. 44 llvm::BasicBlock *SuspendBB = nullptr; 45 46 // The promise type's 'unhandled_exception' handler, if it defines one. 47 Stmt *ExceptionHandler = nullptr; 48 49 // A temporary i1 alloca that stores whether 'await_resume' threw an 50 // exception. If it did, 'true' is stored in this variable, and the coroutine 51 // body must be skipped. If the promise type does not define an exception 52 // handler, this is null. 53 llvm::Value *ResumeEHVar = nullptr; 54 55 // Stores the jump destination just before the coroutine memory is freed. 56 // This is the destination that every suspend point jumps to for the cleanup 57 // branch. 58 CodeGenFunction::JumpDest CleanupJD; 59 60 // Stores the jump destination just before the final suspend. The co_return 61 // statements jumps to this point after calling return_xxx promise member. 62 CodeGenFunction::JumpDest FinalJD; 63 64 // Stores the llvm.coro.id emitted in the function so that we can supply it 65 // as the first argument to coro.begin, coro.alloc and coro.free intrinsics. 66 // Note: llvm.coro.id returns a token that cannot be directly expressed in a 67 // builtin. 68 llvm::CallInst *CoroId = nullptr; 69 70 // Stores the llvm.coro.begin emitted in the function so that we can replace 71 // all coro.frame intrinsics with direct SSA value of coro.begin that returns 72 // the address of the coroutine frame of the current coroutine. 73 llvm::CallInst *CoroBegin = nullptr; 74 75 // Stores the last emitted coro.free for the deallocate expressions, we use it 76 // to wrap dealloc code with if(auto mem = coro.free) dealloc(mem). 77 llvm::CallInst *LastCoroFree = nullptr; 78 79 // If coro.id came from the builtin, remember the expression to give better 80 // diagnostic. If CoroIdExpr is nullptr, the coro.id was created by 81 // EmitCoroutineBody. 82 CallExpr const *CoroIdExpr = nullptr; 83 }; 84 85 // Defining these here allows to keep CGCoroData private to this file. 86 clang::CodeGen::CodeGenFunction::CGCoroInfo::CGCoroInfo() {} 87 CodeGenFunction::CGCoroInfo::~CGCoroInfo() {} 88 89 static void createCoroData(CodeGenFunction &CGF, 90 CodeGenFunction::CGCoroInfo &CurCoro, 91 llvm::CallInst *CoroId, 92 CallExpr const *CoroIdExpr = nullptr) { 93 if (CurCoro.Data) { 94 if (CurCoro.Data->CoroIdExpr) 95 CGF.CGM.Error(CoroIdExpr->getBeginLoc(), 96 "only one __builtin_coro_id can be used in a function"); 97 else if (CoroIdExpr) 98 CGF.CGM.Error(CoroIdExpr->getBeginLoc(), 99 "__builtin_coro_id shall not be used in a C++ coroutine"); 100 else 101 llvm_unreachable("EmitCoroutineBodyStatement called twice?"); 102 103 return; 104 } 105 106 CurCoro.Data = std::unique_ptr<CGCoroData>(new CGCoroData); 107 CurCoro.Data->CoroId = CoroId; 108 CurCoro.Data->CoroIdExpr = CoroIdExpr; 109 } 110 111 // Synthesize a pretty name for a suspend point. 112 static SmallString<32> buildSuspendPrefixStr(CGCoroData &Coro, AwaitKind Kind) { 113 unsigned No = 0; 114 switch (Kind) { 115 case AwaitKind::Init: 116 case AwaitKind::Final: 117 break; 118 case AwaitKind::Normal: 119 No = ++Coro.AwaitNum; 120 break; 121 case AwaitKind::Yield: 122 No = ++Coro.YieldNum; 123 break; 124 } 125 SmallString<32> Prefix(AwaitKindStr[static_cast<unsigned>(Kind)]); 126 if (No > 1) { 127 Twine(No).toVector(Prefix); 128 } 129 return Prefix; 130 } 131 132 // Check if function can throw based on prototype noexcept, also works for 133 // destructors which are implicitly noexcept but can be marked noexcept(false). 134 static bool FunctionCanThrow(const FunctionDecl *D) { 135 const auto *Proto = D->getType()->getAs<FunctionProtoType>(); 136 if (!Proto) { 137 // Function proto is not found, we conservatively assume throwing. 138 return true; 139 } 140 return !isNoexceptExceptionSpec(Proto->getExceptionSpecType()) || 141 Proto->canThrow() != CT_Cannot; 142 } 143 144 static bool ResumeStmtCanThrow(const Stmt *S) { 145 if (const auto *CE = dyn_cast<CallExpr>(S)) { 146 const auto *Callee = CE->getDirectCallee(); 147 if (!Callee) 148 // We don't have direct callee. Conservatively assume throwing. 149 return true; 150 151 if (FunctionCanThrow(Callee)) 152 return true; 153 154 // Fall through to visit the children. 155 } 156 157 if (const auto *TE = dyn_cast<CXXBindTemporaryExpr>(S)) { 158 // Special handling of CXXBindTemporaryExpr here as calling of Dtor of the 159 // temporary is not part of `children()` as covered in the fall through. 160 // We need to mark entire statement as throwing if the destructor of the 161 // temporary throws. 162 const auto *Dtor = TE->getTemporary()->getDestructor(); 163 if (FunctionCanThrow(Dtor)) 164 return true; 165 166 // Fall through to visit the children. 167 } 168 169 for (const auto *child : S->children()) 170 if (ResumeStmtCanThrow(child)) 171 return true; 172 173 return false; 174 } 175 176 // Emit suspend expression which roughly looks like: 177 // 178 // auto && x = CommonExpr(); 179 // if (!x.await_ready()) { 180 // llvm_coro_save(); 181 // x.await_suspend(...); (*) 182 // llvm_coro_suspend(); (**) 183 // } 184 // x.await_resume(); 185 // 186 // where the result of the entire expression is the result of x.await_resume() 187 // 188 // (*) If x.await_suspend return type is bool, it allows to veto a suspend: 189 // if (x.await_suspend(...)) 190 // llvm_coro_suspend(); 191 // 192 // (**) llvm_coro_suspend() encodes three possible continuations as 193 // a switch instruction: 194 // 195 // %where-to = call i8 @llvm.coro.suspend(...) 196 // switch i8 %where-to, label %coro.ret [ ; jump to epilogue to suspend 197 // i8 0, label %yield.ready ; go here when resumed 198 // i8 1, label %yield.cleanup ; go here when destroyed 199 // ] 200 // 201 // See llvm's docs/Coroutines.rst for more details. 202 // 203 namespace { 204 struct LValueOrRValue { 205 LValue LV; 206 RValue RV; 207 }; 208 } 209 static LValueOrRValue emitSuspendExpression(CodeGenFunction &CGF, CGCoroData &Coro, 210 CoroutineSuspendExpr const &S, 211 AwaitKind Kind, AggValueSlot aggSlot, 212 bool ignoreResult, bool forLValue) { 213 auto *E = S.getCommonExpr(); 214 215 auto Binder = 216 CodeGenFunction::OpaqueValueMappingData::bind(CGF, S.getOpaqueValue(), E); 217 auto UnbindOnExit = llvm::make_scope_exit([&] { Binder.unbind(CGF); }); 218 219 auto Prefix = buildSuspendPrefixStr(Coro, Kind); 220 BasicBlock *ReadyBlock = CGF.createBasicBlock(Prefix + Twine(".ready")); 221 BasicBlock *SuspendBlock = CGF.createBasicBlock(Prefix + Twine(".suspend")); 222 BasicBlock *CleanupBlock = CGF.createBasicBlock(Prefix + Twine(".cleanup")); 223 224 // If expression is ready, no need to suspend. 225 CGF.EmitBranchOnBoolExpr(S.getReadyExpr(), ReadyBlock, SuspendBlock, 0); 226 227 // Otherwise, emit suspend logic. 228 CGF.EmitBlock(SuspendBlock); 229 230 auto &Builder = CGF.Builder; 231 llvm::Function *CoroSave = CGF.CGM.getIntrinsic(llvm::Intrinsic::coro_save); 232 auto *NullPtr = llvm::ConstantPointerNull::get(CGF.CGM.Int8PtrTy); 233 auto *SaveCall = Builder.CreateCall(CoroSave, {NullPtr}); 234 235 CGF.CurCoro.InSuspendBlock = true; 236 auto *SuspendRet = CGF.EmitScalarExpr(S.getSuspendExpr()); 237 CGF.CurCoro.InSuspendBlock = false; 238 239 if (SuspendRet != nullptr && SuspendRet->getType()->isIntegerTy(1)) { 240 // Veto suspension if requested by bool returning await_suspend. 241 BasicBlock *RealSuspendBlock = 242 CGF.createBasicBlock(Prefix + Twine(".suspend.bool")); 243 CGF.Builder.CreateCondBr(SuspendRet, RealSuspendBlock, ReadyBlock); 244 CGF.EmitBlock(RealSuspendBlock); 245 } 246 247 // Emit the suspend point. 248 const bool IsFinalSuspend = (Kind == AwaitKind::Final); 249 llvm::Function *CoroSuspend = 250 CGF.CGM.getIntrinsic(llvm::Intrinsic::coro_suspend); 251 auto *SuspendResult = Builder.CreateCall( 252 CoroSuspend, {SaveCall, Builder.getInt1(IsFinalSuspend)}); 253 254 // Create a switch capturing three possible continuations. 255 auto *Switch = Builder.CreateSwitch(SuspendResult, Coro.SuspendBB, 2); 256 Switch->addCase(Builder.getInt8(0), ReadyBlock); 257 Switch->addCase(Builder.getInt8(1), CleanupBlock); 258 259 // Emit cleanup for this suspend point. 260 CGF.EmitBlock(CleanupBlock); 261 CGF.EmitBranchThroughCleanup(Coro.CleanupJD); 262 263 // Emit await_resume expression. 264 CGF.EmitBlock(ReadyBlock); 265 266 // Exception handling requires additional IR. If the 'await_resume' function 267 // is marked as 'noexcept', we avoid generating this additional IR. 268 CXXTryStmt *TryStmt = nullptr; 269 if (Coro.ExceptionHandler && Kind == AwaitKind::Init && 270 ResumeStmtCanThrow(S.getResumeExpr())) { 271 Coro.ResumeEHVar = 272 CGF.CreateTempAlloca(Builder.getInt1Ty(), Prefix + Twine("resume.eh")); 273 Builder.CreateFlagStore(true, Coro.ResumeEHVar); 274 275 auto Loc = S.getResumeExpr()->getExprLoc(); 276 auto *Catch = new (CGF.getContext()) 277 CXXCatchStmt(Loc, /*exDecl=*/nullptr, Coro.ExceptionHandler); 278 auto *TryBody = CompoundStmt::Create(CGF.getContext(), S.getResumeExpr(), 279 FPOptionsOverride(), Loc, Loc); 280 TryStmt = CXXTryStmt::Create(CGF.getContext(), Loc, TryBody, Catch); 281 CGF.EnterCXXTryStmt(*TryStmt); 282 CGF.EmitStmt(TryBody); 283 // We don't use EmitCXXTryStmt here. We need to store to ResumeEHVar that 284 // doesn't exist in the body. 285 Builder.CreateFlagStore(false, Coro.ResumeEHVar); 286 CGF.ExitCXXTryStmt(*TryStmt); 287 LValueOrRValue Res; 288 // We are not supposed to obtain the value from init suspend await_resume(). 289 Res.RV = RValue::getIgnored(); 290 return Res; 291 } 292 293 LValueOrRValue Res; 294 if (forLValue) 295 Res.LV = CGF.EmitLValue(S.getResumeExpr()); 296 else 297 Res.RV = CGF.EmitAnyExpr(S.getResumeExpr(), aggSlot, ignoreResult); 298 299 return Res; 300 } 301 302 RValue CodeGenFunction::EmitCoawaitExpr(const CoawaitExpr &E, 303 AggValueSlot aggSlot, 304 bool ignoreResult) { 305 return emitSuspendExpression(*this, *CurCoro.Data, E, 306 CurCoro.Data->CurrentAwaitKind, aggSlot, 307 ignoreResult, /*forLValue*/false).RV; 308 } 309 RValue CodeGenFunction::EmitCoyieldExpr(const CoyieldExpr &E, 310 AggValueSlot aggSlot, 311 bool ignoreResult) { 312 return emitSuspendExpression(*this, *CurCoro.Data, E, AwaitKind::Yield, 313 aggSlot, ignoreResult, /*forLValue*/false).RV; 314 } 315 316 void CodeGenFunction::EmitCoreturnStmt(CoreturnStmt const &S) { 317 ++CurCoro.Data->CoreturnCount; 318 const Expr *RV = S.getOperand(); 319 if (RV && RV->getType()->isVoidType() && !isa<InitListExpr>(RV)) { 320 // Make sure to evaluate the non initlist expression of a co_return 321 // with a void expression for side effects. 322 RunCleanupsScope cleanupScope(*this); 323 EmitIgnoredExpr(RV); 324 } 325 EmitStmt(S.getPromiseCall()); 326 EmitBranchThroughCleanup(CurCoro.Data->FinalJD); 327 } 328 329 330 #ifndef NDEBUG 331 static QualType getCoroutineSuspendExprReturnType(const ASTContext &Ctx, 332 const CoroutineSuspendExpr *E) { 333 const auto *RE = E->getResumeExpr(); 334 // Is it possible for RE to be a CXXBindTemporaryExpr wrapping 335 // a MemberCallExpr? 336 assert(isa<CallExpr>(RE) && "unexpected suspend expression type"); 337 return cast<CallExpr>(RE)->getCallReturnType(Ctx); 338 } 339 #endif 340 341 LValue 342 CodeGenFunction::EmitCoawaitLValue(const CoawaitExpr *E) { 343 assert(getCoroutineSuspendExprReturnType(getContext(), E)->isReferenceType() && 344 "Can't have a scalar return unless the return type is a " 345 "reference type!"); 346 return emitSuspendExpression(*this, *CurCoro.Data, *E, 347 CurCoro.Data->CurrentAwaitKind, AggValueSlot::ignored(), 348 /*ignoreResult*/false, /*forLValue*/true).LV; 349 } 350 351 LValue 352 CodeGenFunction::EmitCoyieldLValue(const CoyieldExpr *E) { 353 assert(getCoroutineSuspendExprReturnType(getContext(), E)->isReferenceType() && 354 "Can't have a scalar return unless the return type is a " 355 "reference type!"); 356 return emitSuspendExpression(*this, *CurCoro.Data, *E, 357 AwaitKind::Yield, AggValueSlot::ignored(), 358 /*ignoreResult*/false, /*forLValue*/true).LV; 359 } 360 361 // Hunts for the parameter reference in the parameter copy/move declaration. 362 namespace { 363 struct GetParamRef : public StmtVisitor<GetParamRef> { 364 public: 365 DeclRefExpr *Expr = nullptr; 366 GetParamRef() {} 367 void VisitDeclRefExpr(DeclRefExpr *E) { 368 assert(Expr == nullptr && "multilple declref in param move"); 369 Expr = E; 370 } 371 void VisitStmt(Stmt *S) { 372 for (auto *C : S->children()) { 373 if (C) 374 Visit(C); 375 } 376 } 377 }; 378 } 379 380 // This class replaces references to parameters to their copies by changing 381 // the addresses in CGF.LocalDeclMap and restoring back the original values in 382 // its destructor. 383 384 namespace { 385 struct ParamReferenceReplacerRAII { 386 CodeGenFunction::DeclMapTy SavedLocals; 387 CodeGenFunction::DeclMapTy& LocalDeclMap; 388 389 ParamReferenceReplacerRAII(CodeGenFunction::DeclMapTy &LocalDeclMap) 390 : LocalDeclMap(LocalDeclMap) {} 391 392 void addCopy(DeclStmt const *PM) { 393 // Figure out what param it refers to. 394 395 assert(PM->isSingleDecl()); 396 VarDecl const*VD = static_cast<VarDecl const*>(PM->getSingleDecl()); 397 Expr const *InitExpr = VD->getInit(); 398 GetParamRef Visitor; 399 Visitor.Visit(const_cast<Expr*>(InitExpr)); 400 assert(Visitor.Expr); 401 DeclRefExpr *DREOrig = Visitor.Expr; 402 auto *PD = DREOrig->getDecl(); 403 404 auto it = LocalDeclMap.find(PD); 405 assert(it != LocalDeclMap.end() && "parameter is not found"); 406 SavedLocals.insert({ PD, it->second }); 407 408 auto copyIt = LocalDeclMap.find(VD); 409 assert(copyIt != LocalDeclMap.end() && "parameter copy is not found"); 410 it->second = copyIt->getSecond(); 411 } 412 413 ~ParamReferenceReplacerRAII() { 414 for (auto&& SavedLocal : SavedLocals) { 415 LocalDeclMap.insert({SavedLocal.first, SavedLocal.second}); 416 } 417 } 418 }; 419 } 420 421 // For WinEH exception representation backend needs to know what funclet coro.end 422 // belongs to. That information is passed in a funclet bundle. 423 static SmallVector<llvm::OperandBundleDef, 1> 424 getBundlesForCoroEnd(CodeGenFunction &CGF) { 425 SmallVector<llvm::OperandBundleDef, 1> BundleList; 426 427 if (llvm::Instruction *EHPad = CGF.CurrentFuncletPad) 428 BundleList.emplace_back("funclet", EHPad); 429 430 return BundleList; 431 } 432 433 namespace { 434 // We will insert coro.end to cut any of the destructors for objects that 435 // do not need to be destroyed once the coroutine is resumed. 436 // See llvm/docs/Coroutines.rst for more details about coro.end. 437 struct CallCoroEnd final : public EHScopeStack::Cleanup { 438 void Emit(CodeGenFunction &CGF, Flags flags) override { 439 auto &CGM = CGF.CGM; 440 auto *NullPtr = llvm::ConstantPointerNull::get(CGF.Int8PtrTy); 441 llvm::Function *CoroEndFn = CGM.getIntrinsic(llvm::Intrinsic::coro_end); 442 // See if we have a funclet bundle to associate coro.end with. (WinEH) 443 auto Bundles = getBundlesForCoroEnd(CGF); 444 auto *CoroEnd = 445 CGF.Builder.CreateCall(CoroEndFn, 446 {NullPtr, CGF.Builder.getTrue(), 447 llvm::ConstantTokenNone::get(CoroEndFn->getContext())}, 448 Bundles); 449 if (Bundles.empty()) { 450 // Otherwise, (landingpad model), create a conditional branch that leads 451 // either to a cleanup block or a block with EH resume instruction. 452 auto *ResumeBB = CGF.getEHResumeBlock(/*isCleanup=*/true); 453 auto *CleanupContBB = CGF.createBasicBlock("cleanup.cont"); 454 CGF.Builder.CreateCondBr(CoroEnd, ResumeBB, CleanupContBB); 455 CGF.EmitBlock(CleanupContBB); 456 } 457 } 458 }; 459 } 460 461 namespace { 462 // Make sure to call coro.delete on scope exit. 463 struct CallCoroDelete final : public EHScopeStack::Cleanup { 464 Stmt *Deallocate; 465 466 // Emit "if (coro.free(CoroId, CoroBegin)) Deallocate;" 467 468 // Note: That deallocation will be emitted twice: once for a normal exit and 469 // once for exceptional exit. This usage is safe because Deallocate does not 470 // contain any declarations. The SubStmtBuilder::makeNewAndDeleteExpr() 471 // builds a single call to a deallocation function which is safe to emit 472 // multiple times. 473 void Emit(CodeGenFunction &CGF, Flags) override { 474 // Remember the current point, as we are going to emit deallocation code 475 // first to get to coro.free instruction that is an argument to a delete 476 // call. 477 BasicBlock *SaveInsertBlock = CGF.Builder.GetInsertBlock(); 478 479 auto *FreeBB = CGF.createBasicBlock("coro.free"); 480 CGF.EmitBlock(FreeBB); 481 CGF.EmitStmt(Deallocate); 482 483 auto *AfterFreeBB = CGF.createBasicBlock("after.coro.free"); 484 CGF.EmitBlock(AfterFreeBB); 485 486 // We should have captured coro.free from the emission of deallocate. 487 auto *CoroFree = CGF.CurCoro.Data->LastCoroFree; 488 if (!CoroFree) { 489 CGF.CGM.Error(Deallocate->getBeginLoc(), 490 "Deallocation expressoin does not refer to coro.free"); 491 return; 492 } 493 494 // Get back to the block we were originally and move coro.free there. 495 auto *InsertPt = SaveInsertBlock->getTerminator(); 496 CoroFree->moveBefore(InsertPt); 497 CGF.Builder.SetInsertPoint(InsertPt); 498 499 // Add if (auto *mem = coro.free) Deallocate; 500 auto *NullPtr = llvm::ConstantPointerNull::get(CGF.Int8PtrTy); 501 auto *Cond = CGF.Builder.CreateICmpNE(CoroFree, NullPtr); 502 CGF.Builder.CreateCondBr(Cond, FreeBB, AfterFreeBB); 503 504 // No longer need old terminator. 505 InsertPt->eraseFromParent(); 506 CGF.Builder.SetInsertPoint(AfterFreeBB); 507 } 508 explicit CallCoroDelete(Stmt *DeallocStmt) : Deallocate(DeallocStmt) {} 509 }; 510 } 511 512 namespace { 513 struct GetReturnObjectManager { 514 CodeGenFunction &CGF; 515 CGBuilderTy &Builder; 516 const CoroutineBodyStmt &S; 517 // When true, performs RVO for the return object. 518 bool DirectEmit = false; 519 520 Address GroActiveFlag; 521 CodeGenFunction::AutoVarEmission GroEmission; 522 523 GetReturnObjectManager(CodeGenFunction &CGF, const CoroutineBodyStmt &S) 524 : CGF(CGF), Builder(CGF.Builder), S(S), GroActiveFlag(Address::invalid()), 525 GroEmission(CodeGenFunction::AutoVarEmission::invalid()) { 526 // The call to get_return_object is sequenced before the call to 527 // initial_suspend and is invoked at most once, but there are caveats 528 // regarding on whether the prvalue result object may be initialized 529 // directly/eager or delayed, depending on the types involved. 530 // 531 // More info at https://github.com/cplusplus/papers/issues/1414 532 // 533 // The general cases: 534 // 1. Same type of get_return_object and coroutine return type (direct 535 // emission): 536 // - Constructed in the return slot. 537 // 2. Different types (delayed emission): 538 // - Constructed temporary object prior to initial suspend initialized with 539 // a call to get_return_object() 540 // - When coroutine needs to to return to the caller and needs to construct 541 // return value for the coroutine it is initialized with expiring value of 542 // the temporary obtained above. 543 // 544 // Direct emission for void returning coroutines or GROs. 545 DirectEmit = [&]() { 546 auto *RVI = S.getReturnValueInit(); 547 assert(RVI && "expected RVI"); 548 auto GroType = RVI->getType(); 549 return CGF.getContext().hasSameType(GroType, CGF.FnRetTy); 550 }(); 551 } 552 553 // The gro variable has to outlive coroutine frame and coroutine promise, but, 554 // it can only be initialized after coroutine promise was created, thus, we 555 // split its emission in two parts. EmitGroAlloca emits an alloca and sets up 556 // cleanups. Later when coroutine promise is available we initialize the gro 557 // and sets the flag that the cleanup is now active. 558 void EmitGroAlloca() { 559 if (DirectEmit) 560 return; 561 562 auto *GroDeclStmt = dyn_cast_or_null<DeclStmt>(S.getResultDecl()); 563 if (!GroDeclStmt) { 564 // If get_return_object returns void, no need to do an alloca. 565 return; 566 } 567 568 auto *GroVarDecl = cast<VarDecl>(GroDeclStmt->getSingleDecl()); 569 570 // Set GRO flag that it is not initialized yet 571 GroActiveFlag = CGF.CreateTempAlloca(Builder.getInt1Ty(), CharUnits::One(), 572 "gro.active"); 573 Builder.CreateStore(Builder.getFalse(), GroActiveFlag); 574 575 GroEmission = CGF.EmitAutoVarAlloca(*GroVarDecl); 576 auto *GroAlloca = dyn_cast_or_null<llvm::AllocaInst>( 577 GroEmission.getOriginalAllocatedAddress().getPointer()); 578 assert(GroAlloca && "expected alloca to be emitted"); 579 GroAlloca->setMetadata(llvm::LLVMContext::MD_coro_outside_frame, 580 llvm::MDNode::get(CGF.CGM.getLLVMContext(), {})); 581 582 // Remember the top of EHStack before emitting the cleanup. 583 auto old_top = CGF.EHStack.stable_begin(); 584 CGF.EmitAutoVarCleanups(GroEmission); 585 auto top = CGF.EHStack.stable_begin(); 586 587 // Make the cleanup conditional on gro.active 588 for (auto b = CGF.EHStack.find(top), e = CGF.EHStack.find(old_top); b != e; 589 b++) { 590 if (auto *Cleanup = dyn_cast<EHCleanupScope>(&*b)) { 591 assert(!Cleanup->hasActiveFlag() && "cleanup already has active flag?"); 592 Cleanup->setActiveFlag(GroActiveFlag); 593 Cleanup->setTestFlagInEHCleanup(); 594 Cleanup->setTestFlagInNormalCleanup(); 595 } 596 } 597 } 598 599 void EmitGroInit() { 600 if (DirectEmit) { 601 // ReturnValue should be valid as long as the coroutine's return type 602 // is not void. The assertion could help us to reduce the check later. 603 assert(CGF.ReturnValue.isValid() == (bool)S.getReturnStmt()); 604 // Now we have the promise, initialize the GRO. 605 // We need to emit `get_return_object` first. According to: 606 // [dcl.fct.def.coroutine]p7 607 // The call to get_return_object is sequenced before the call to 608 // initial_suspend and is invoked at most once. 609 // 610 // So we couldn't emit return value when we emit return statment, 611 // otherwise the call to get_return_object wouldn't be in front 612 // of initial_suspend. 613 if (CGF.ReturnValue.isValid()) { 614 CGF.EmitAnyExprToMem(S.getReturnValue(), CGF.ReturnValue, 615 S.getReturnValue()->getType().getQualifiers(), 616 /*IsInit*/ true); 617 } 618 return; 619 } 620 621 if (!GroActiveFlag.isValid()) { 622 // No Gro variable was allocated. Simply emit the call to 623 // get_return_object. 624 CGF.EmitStmt(S.getResultDecl()); 625 return; 626 } 627 628 CGF.EmitAutoVarInit(GroEmission); 629 Builder.CreateStore(Builder.getTrue(), GroActiveFlag); 630 } 631 }; 632 } // namespace 633 634 static void emitBodyAndFallthrough(CodeGenFunction &CGF, 635 const CoroutineBodyStmt &S, Stmt *Body) { 636 CGF.EmitStmt(Body); 637 const bool CanFallthrough = CGF.Builder.GetInsertBlock(); 638 if (CanFallthrough) 639 if (Stmt *OnFallthrough = S.getFallthroughHandler()) 640 CGF.EmitStmt(OnFallthrough); 641 } 642 643 void CodeGenFunction::EmitCoroutineBody(const CoroutineBodyStmt &S) { 644 auto *NullPtr = llvm::ConstantPointerNull::get(Builder.getPtrTy()); 645 auto &TI = CGM.getContext().getTargetInfo(); 646 unsigned NewAlign = TI.getNewAlign() / TI.getCharWidth(); 647 648 auto *EntryBB = Builder.GetInsertBlock(); 649 auto *AllocBB = createBasicBlock("coro.alloc"); 650 auto *InitBB = createBasicBlock("coro.init"); 651 auto *FinalBB = createBasicBlock("coro.final"); 652 auto *RetBB = createBasicBlock("coro.ret"); 653 654 auto *CoroId = Builder.CreateCall( 655 CGM.getIntrinsic(llvm::Intrinsic::coro_id), 656 {Builder.getInt32(NewAlign), NullPtr, NullPtr, NullPtr}); 657 createCoroData(*this, CurCoro, CoroId); 658 CurCoro.Data->SuspendBB = RetBB; 659 assert(ShouldEmitLifetimeMarkers && 660 "Must emit lifetime intrinsics for coroutines"); 661 662 // Backend is allowed to elide memory allocations, to help it, emit 663 // auto mem = coro.alloc() ? 0 : ... allocation code ...; 664 auto *CoroAlloc = Builder.CreateCall( 665 CGM.getIntrinsic(llvm::Intrinsic::coro_alloc), {CoroId}); 666 667 Builder.CreateCondBr(CoroAlloc, AllocBB, InitBB); 668 669 EmitBlock(AllocBB); 670 auto *AllocateCall = EmitScalarExpr(S.getAllocate()); 671 auto *AllocOrInvokeContBB = Builder.GetInsertBlock(); 672 673 // Handle allocation failure if 'ReturnStmtOnAllocFailure' was provided. 674 if (auto *RetOnAllocFailure = S.getReturnStmtOnAllocFailure()) { 675 auto *RetOnFailureBB = createBasicBlock("coro.ret.on.failure"); 676 677 // See if allocation was successful. 678 auto *NullPtr = llvm::ConstantPointerNull::get(Int8PtrTy); 679 auto *Cond = Builder.CreateICmpNE(AllocateCall, NullPtr); 680 // Expect the allocation to be successful. 681 emitCondLikelihoodViaExpectIntrinsic(Cond, Stmt::LH_Likely); 682 Builder.CreateCondBr(Cond, InitBB, RetOnFailureBB); 683 684 // If not, return OnAllocFailure object. 685 EmitBlock(RetOnFailureBB); 686 EmitStmt(RetOnAllocFailure); 687 } 688 else { 689 Builder.CreateBr(InitBB); 690 } 691 692 EmitBlock(InitBB); 693 694 // Pass the result of the allocation to coro.begin. 695 auto *Phi = Builder.CreatePHI(VoidPtrTy, 2); 696 Phi->addIncoming(NullPtr, EntryBB); 697 Phi->addIncoming(AllocateCall, AllocOrInvokeContBB); 698 auto *CoroBegin = Builder.CreateCall( 699 CGM.getIntrinsic(llvm::Intrinsic::coro_begin), {CoroId, Phi}); 700 CurCoro.Data->CoroBegin = CoroBegin; 701 702 GetReturnObjectManager GroManager(*this, S); 703 GroManager.EmitGroAlloca(); 704 705 CurCoro.Data->CleanupJD = getJumpDestInCurrentScope(RetBB); 706 { 707 CGDebugInfo *DI = getDebugInfo(); 708 ParamReferenceReplacerRAII ParamReplacer(LocalDeclMap); 709 CodeGenFunction::RunCleanupsScope ResumeScope(*this); 710 EHStack.pushCleanup<CallCoroDelete>(NormalAndEHCleanup, S.getDeallocate()); 711 712 // Create mapping between parameters and copy-params for coroutine function. 713 llvm::ArrayRef<const Stmt *> ParamMoves = S.getParamMoves(); 714 assert( 715 (ParamMoves.size() == 0 || (ParamMoves.size() == FnArgs.size())) && 716 "ParamMoves and FnArgs should be the same size for coroutine function"); 717 if (ParamMoves.size() == FnArgs.size() && DI) 718 for (const auto Pair : llvm::zip(FnArgs, ParamMoves)) 719 DI->getCoroutineParameterMappings().insert( 720 {std::get<0>(Pair), std::get<1>(Pair)}); 721 722 // Create parameter copies. We do it before creating a promise, since an 723 // evolution of coroutine TS may allow promise constructor to observe 724 // parameter copies. 725 for (auto *PM : S.getParamMoves()) { 726 EmitStmt(PM); 727 ParamReplacer.addCopy(cast<DeclStmt>(PM)); 728 // TODO: if(CoroParam(...)) need to surround ctor and dtor 729 // for the copy, so that llvm can elide it if the copy is 730 // not needed. 731 } 732 733 EmitStmt(S.getPromiseDeclStmt()); 734 735 Address PromiseAddr = GetAddrOfLocalVar(S.getPromiseDecl()); 736 auto *PromiseAddrVoidPtr = 737 new llvm::BitCastInst(PromiseAddr.getPointer(), VoidPtrTy, "", CoroId); 738 // Update CoroId to refer to the promise. We could not do it earlier because 739 // promise local variable was not emitted yet. 740 CoroId->setArgOperand(1, PromiseAddrVoidPtr); 741 742 // Now we have the promise, initialize the GRO 743 GroManager.EmitGroInit(); 744 745 EHStack.pushCleanup<CallCoroEnd>(EHCleanup); 746 747 CurCoro.Data->CurrentAwaitKind = AwaitKind::Init; 748 CurCoro.Data->ExceptionHandler = S.getExceptionHandler(); 749 EmitStmt(S.getInitSuspendStmt()); 750 CurCoro.Data->FinalJD = getJumpDestInCurrentScope(FinalBB); 751 752 CurCoro.Data->CurrentAwaitKind = AwaitKind::Normal; 753 754 if (CurCoro.Data->ExceptionHandler) { 755 // If we generated IR to record whether an exception was thrown from 756 // 'await_resume', then use that IR to determine whether the coroutine 757 // body should be skipped. 758 // If we didn't generate the IR (perhaps because 'await_resume' was marked 759 // as 'noexcept'), then we skip this check. 760 BasicBlock *ContBB = nullptr; 761 if (CurCoro.Data->ResumeEHVar) { 762 BasicBlock *BodyBB = createBasicBlock("coro.resumed.body"); 763 ContBB = createBasicBlock("coro.resumed.cont"); 764 Value *SkipBody = Builder.CreateFlagLoad(CurCoro.Data->ResumeEHVar, 765 "coro.resumed.eh"); 766 Builder.CreateCondBr(SkipBody, ContBB, BodyBB); 767 EmitBlock(BodyBB); 768 } 769 770 auto Loc = S.getBeginLoc(); 771 CXXCatchStmt Catch(Loc, /*exDecl=*/nullptr, 772 CurCoro.Data->ExceptionHandler); 773 auto *TryStmt = 774 CXXTryStmt::Create(getContext(), Loc, S.getBody(), &Catch); 775 776 EnterCXXTryStmt(*TryStmt); 777 emitBodyAndFallthrough(*this, S, TryStmt->getTryBlock()); 778 ExitCXXTryStmt(*TryStmt); 779 780 if (ContBB) 781 EmitBlock(ContBB); 782 } 783 else { 784 emitBodyAndFallthrough(*this, S, S.getBody()); 785 } 786 787 // See if we need to generate final suspend. 788 const bool CanFallthrough = Builder.GetInsertBlock(); 789 const bool HasCoreturns = CurCoro.Data->CoreturnCount > 0; 790 if (CanFallthrough || HasCoreturns) { 791 EmitBlock(FinalBB); 792 CurCoro.Data->CurrentAwaitKind = AwaitKind::Final; 793 EmitStmt(S.getFinalSuspendStmt()); 794 } else { 795 // We don't need FinalBB. Emit it to make sure the block is deleted. 796 EmitBlock(FinalBB, /*IsFinished=*/true); 797 } 798 } 799 800 EmitBlock(RetBB); 801 // Emit coro.end before getReturnStmt (and parameter destructors), since 802 // resume and destroy parts of the coroutine should not include them. 803 llvm::Function *CoroEnd = CGM.getIntrinsic(llvm::Intrinsic::coro_end); 804 Builder.CreateCall(CoroEnd, 805 {NullPtr, Builder.getFalse(), 806 llvm::ConstantTokenNone::get(CoroEnd->getContext())}); 807 808 if (Stmt *Ret = S.getReturnStmt()) { 809 // Since we already emitted the return value above, so we shouldn't 810 // emit it again here. 811 if (GroManager.DirectEmit) 812 cast<ReturnStmt>(Ret)->setRetValue(nullptr); 813 EmitStmt(Ret); 814 } 815 816 // LLVM require the frontend to mark the coroutine. 817 CurFn->setPresplitCoroutine(); 818 819 if (CXXRecordDecl *RD = FnRetTy->getAsCXXRecordDecl(); 820 RD && RD->hasAttr<CoroOnlyDestroyWhenCompleteAttr>()) 821 CurFn->setCoroDestroyOnlyWhenComplete(); 822 } 823 824 // Emit coroutine intrinsic and patch up arguments of the token type. 825 RValue CodeGenFunction::EmitCoroutineIntrinsic(const CallExpr *E, 826 unsigned int IID) { 827 SmallVector<llvm::Value *, 8> Args; 828 switch (IID) { 829 default: 830 break; 831 // The coro.frame builtin is replaced with an SSA value of the coro.begin 832 // intrinsic. 833 case llvm::Intrinsic::coro_frame: { 834 if (CurCoro.Data && CurCoro.Data->CoroBegin) { 835 return RValue::get(CurCoro.Data->CoroBegin); 836 } 837 CGM.Error(E->getBeginLoc(), "this builtin expect that __builtin_coro_begin " 838 "has been used earlier in this function"); 839 auto *NullPtr = llvm::ConstantPointerNull::get(Builder.getPtrTy()); 840 return RValue::get(NullPtr); 841 } 842 case llvm::Intrinsic::coro_size: { 843 auto &Context = getContext(); 844 CanQualType SizeTy = Context.getSizeType(); 845 llvm::IntegerType *T = Builder.getIntNTy(Context.getTypeSize(SizeTy)); 846 llvm::Function *F = CGM.getIntrinsic(llvm::Intrinsic::coro_size, T); 847 return RValue::get(Builder.CreateCall(F)); 848 } 849 case llvm::Intrinsic::coro_align: { 850 auto &Context = getContext(); 851 CanQualType SizeTy = Context.getSizeType(); 852 llvm::IntegerType *T = Builder.getIntNTy(Context.getTypeSize(SizeTy)); 853 llvm::Function *F = CGM.getIntrinsic(llvm::Intrinsic::coro_align, T); 854 return RValue::get(Builder.CreateCall(F)); 855 } 856 // The following three intrinsics take a token parameter referring to a token 857 // returned by earlier call to @llvm.coro.id. Since we cannot represent it in 858 // builtins, we patch it up here. 859 case llvm::Intrinsic::coro_alloc: 860 case llvm::Intrinsic::coro_begin: 861 case llvm::Intrinsic::coro_free: { 862 if (CurCoro.Data && CurCoro.Data->CoroId) { 863 Args.push_back(CurCoro.Data->CoroId); 864 break; 865 } 866 CGM.Error(E->getBeginLoc(), "this builtin expect that __builtin_coro_id has" 867 " been used earlier in this function"); 868 // Fallthrough to the next case to add TokenNone as the first argument. 869 [[fallthrough]]; 870 } 871 // @llvm.coro.suspend takes a token parameter. Add token 'none' as the first 872 // argument. 873 case llvm::Intrinsic::coro_suspend: 874 Args.push_back(llvm::ConstantTokenNone::get(getLLVMContext())); 875 break; 876 } 877 for (const Expr *Arg : E->arguments()) 878 Args.push_back(EmitScalarExpr(Arg)); 879 // @llvm.coro.end takes a token parameter. Add token 'none' as the last 880 // argument. 881 if (IID == llvm::Intrinsic::coro_end) 882 Args.push_back(llvm::ConstantTokenNone::get(getLLVMContext())); 883 884 llvm::Function *F = CGM.getIntrinsic(IID); 885 llvm::CallInst *Call = Builder.CreateCall(F, Args); 886 887 // Note: The following code is to enable to emit coro.id and coro.begin by 888 // hand to experiment with coroutines in C. 889 // If we see @llvm.coro.id remember it in the CoroData. We will update 890 // coro.alloc, coro.begin and coro.free intrinsics to refer to it. 891 if (IID == llvm::Intrinsic::coro_id) { 892 createCoroData(*this, CurCoro, Call, E); 893 } 894 else if (IID == llvm::Intrinsic::coro_begin) { 895 if (CurCoro.Data) 896 CurCoro.Data->CoroBegin = Call; 897 } 898 else if (IID == llvm::Intrinsic::coro_free) { 899 // Remember the last coro_free as we need it to build the conditional 900 // deletion of the coroutine frame. 901 if (CurCoro.Data) 902 CurCoro.Data->LastCoroFree = Call; 903 } 904 return RValue::get(Call); 905 } 906