1 //===--- ParseInit.cpp - Initializer Parsing ------------------------------===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 // 9 // This file implements initializer parsing as specified by C99 6.7.8. 10 // 11 //===----------------------------------------------------------------------===// 12 13 #include "clang/Basic/TokenKinds.h" 14 #include "clang/Parse/ParseDiagnostic.h" 15 #include "clang/Parse/Parser.h" 16 #include "clang/Parse/RAIIObjectsForParser.h" 17 #include "clang/Sema/Designator.h" 18 #include "clang/Sema/EnterExpressionEvaluationContext.h" 19 #include "clang/Sema/Ownership.h" 20 #include "clang/Sema/Scope.h" 21 #include "llvm/ADT/STLExtras.h" 22 #include "llvm/ADT/SmallString.h" 23 using namespace clang; 24 25 26 /// MayBeDesignationStart - Return true if the current token might be the start 27 /// of a designator. If we can tell it is impossible that it is a designator, 28 /// return false. 29 bool Parser::MayBeDesignationStart() { 30 switch (Tok.getKind()) { 31 default: 32 return false; 33 34 case tok::period: // designator: '.' identifier 35 return true; 36 37 case tok::l_square: { // designator: array-designator 38 if (!PP.getLangOpts().CPlusPlus11) 39 return true; 40 41 // C++11 lambda expressions and C99 designators can be ambiguous all the 42 // way through the closing ']' and to the next character. Handle the easy 43 // cases here, and fall back to tentative parsing if those fail. 44 switch (PP.LookAhead(0).getKind()) { 45 case tok::equal: 46 case tok::ellipsis: 47 case tok::r_square: 48 // Definitely starts a lambda expression. 49 return false; 50 51 case tok::amp: 52 case tok::kw_this: 53 case tok::star: 54 case tok::identifier: 55 // We have to do additional analysis, because these could be the 56 // start of a constant expression or a lambda capture list. 57 break; 58 59 default: 60 // Anything not mentioned above cannot occur following a '[' in a 61 // lambda expression. 62 return true; 63 } 64 65 // Handle the complicated case below. 66 break; 67 } 68 case tok::identifier: // designation: identifier ':' 69 return PP.LookAhead(0).is(tok::colon); 70 } 71 72 // Parse up to (at most) the token after the closing ']' to determine 73 // whether this is a C99 designator or a lambda. 74 RevertingTentativeParsingAction Tentative(*this); 75 76 LambdaIntroducer Intro; 77 LambdaIntroducerTentativeParse ParseResult; 78 if (ParseLambdaIntroducer(Intro, &ParseResult)) { 79 // Hit and diagnosed an error in a lambda. 80 // FIXME: Tell the caller this happened so they can recover. 81 return true; 82 } 83 84 switch (ParseResult) { 85 case LambdaIntroducerTentativeParse::Success: 86 case LambdaIntroducerTentativeParse::Incomplete: 87 // Might be a lambda-expression. Keep looking. 88 // FIXME: If our tentative parse was not incomplete, parse the lambda from 89 // here rather than throwing away then reparsing the LambdaIntroducer. 90 break; 91 92 case LambdaIntroducerTentativeParse::MessageSend: 93 case LambdaIntroducerTentativeParse::Invalid: 94 // Can't be a lambda-expression. Treat it as a designator. 95 // FIXME: Should we disambiguate against a message-send? 96 return true; 97 } 98 99 // Once we hit the closing square bracket, we look at the next 100 // token. If it's an '=', this is a designator. Otherwise, it's a 101 // lambda expression. This decision favors lambdas over the older 102 // GNU designator syntax, which allows one to omit the '=', but is 103 // consistent with GCC. 104 return Tok.is(tok::equal); 105 } 106 107 static void CheckArrayDesignatorSyntax(Parser &P, SourceLocation Loc, 108 Designation &Desig) { 109 // If we have exactly one array designator, this used the GNU 110 // 'designation: array-designator' extension, otherwise there should be no 111 // designators at all! 112 if (Desig.getNumDesignators() == 1 && 113 (Desig.getDesignator(0).isArrayDesignator() || 114 Desig.getDesignator(0).isArrayRangeDesignator())) 115 P.Diag(Loc, diag::ext_gnu_missing_equal_designator); 116 else if (Desig.getNumDesignators() > 0) 117 P.Diag(Loc, diag::err_expected_equal_designator); 118 } 119 120 /// ParseInitializerWithPotentialDesignator - Parse the 'initializer' production 121 /// checking to see if the token stream starts with a designator. 122 /// 123 /// C99: 124 /// 125 /// designation: 126 /// designator-list '=' 127 /// [GNU] array-designator 128 /// [GNU] identifier ':' 129 /// 130 /// designator-list: 131 /// designator 132 /// designator-list designator 133 /// 134 /// designator: 135 /// array-designator 136 /// '.' identifier 137 /// 138 /// array-designator: 139 /// '[' constant-expression ']' 140 /// [GNU] '[' constant-expression '...' constant-expression ']' 141 /// 142 /// C++20: 143 /// 144 /// designated-initializer-list: 145 /// designated-initializer-clause 146 /// designated-initializer-list ',' designated-initializer-clause 147 /// 148 /// designated-initializer-clause: 149 /// designator brace-or-equal-initializer 150 /// 151 /// designator: 152 /// '.' identifier 153 /// 154 /// We allow the C99 syntax extensions in C++20, but do not allow the C++20 155 /// extension (a braced-init-list after the designator with no '=') in C99. 156 /// 157 /// NOTE: [OBC] allows '[ objc-receiver objc-message-args ]' as an 158 /// initializer (because it is an expression). We need to consider this case 159 /// when parsing array designators. 160 /// 161 /// \p CodeCompleteCB is called with Designation parsed so far. 162 ExprResult Parser::ParseInitializerWithPotentialDesignator( 163 DesignatorCompletionInfo DesignatorCompletion) { 164 // If this is the old-style GNU extension: 165 // designation ::= identifier ':' 166 // Handle it as a field designator. Otherwise, this must be the start of a 167 // normal expression. 168 if (Tok.is(tok::identifier)) { 169 const IdentifierInfo *FieldName = Tok.getIdentifierInfo(); 170 171 SmallString<256> NewSyntax; 172 llvm::raw_svector_ostream(NewSyntax) << '.' << FieldName->getName() 173 << " = "; 174 175 SourceLocation NameLoc = ConsumeToken(); // Eat the identifier. 176 177 assert(Tok.is(tok::colon) && "MayBeDesignationStart not working properly!"); 178 SourceLocation ColonLoc = ConsumeToken(); 179 180 Diag(NameLoc, diag::ext_gnu_old_style_field_designator) 181 << FixItHint::CreateReplacement(SourceRange(NameLoc, ColonLoc), 182 NewSyntax); 183 184 Designation D; 185 D.AddDesignator(Designator::CreateFieldDesignator( 186 FieldName, SourceLocation(), NameLoc)); 187 PreferredType.enterDesignatedInitializer( 188 Tok.getLocation(), DesignatorCompletion.PreferredBaseType, D); 189 return Actions.ActOnDesignatedInitializer(D, ColonLoc, true, 190 ParseInitializer()); 191 } 192 193 // Desig - This is initialized when we see our first designator. We may have 194 // an objc message send with no designator, so we don't want to create this 195 // eagerly. 196 Designation Desig; 197 198 // Parse each designator in the designator list until we find an initializer. 199 while (Tok.is(tok::period) || Tok.is(tok::l_square)) { 200 if (Tok.is(tok::period)) { 201 // designator: '.' identifier 202 SourceLocation DotLoc = ConsumeToken(); 203 204 if (Tok.is(tok::code_completion)) { 205 cutOffParsing(); 206 Actions.CodeCompleteDesignator(DesignatorCompletion.PreferredBaseType, 207 DesignatorCompletion.InitExprs, Desig); 208 return ExprError(); 209 } 210 if (Tok.isNot(tok::identifier)) { 211 Diag(Tok.getLocation(), diag::err_expected_field_designator); 212 return ExprError(); 213 } 214 215 Desig.AddDesignator(Designator::CreateFieldDesignator( 216 Tok.getIdentifierInfo(), DotLoc, Tok.getLocation())); 217 ConsumeToken(); // Eat the identifier. 218 continue; 219 } 220 221 // We must have either an array designator now or an objc message send. 222 assert(Tok.is(tok::l_square) && "Unexpected token!"); 223 224 // Handle the two forms of array designator: 225 // array-designator: '[' constant-expression ']' 226 // array-designator: '[' constant-expression '...' constant-expression ']' 227 // 228 // Also, we have to handle the case where the expression after the 229 // designator an an objc message send: '[' objc-message-expr ']'. 230 // Interesting cases are: 231 // [foo bar] -> objc message send 232 // [foo] -> array designator 233 // [foo ... bar] -> array designator 234 // [4][foo bar] -> obsolete GNU designation with objc message send. 235 // 236 // We do not need to check for an expression starting with [[ here. If it 237 // contains an Objective-C message send, then it is not an ill-formed 238 // attribute. If it is a lambda-expression within an array-designator, then 239 // it will be rejected because a constant-expression cannot begin with a 240 // lambda-expression. 241 InMessageExpressionRAIIObject InMessage(*this, true); 242 243 BalancedDelimiterTracker T(*this, tok::l_square); 244 T.consumeOpen(); 245 SourceLocation StartLoc = T.getOpenLocation(); 246 247 ExprResult Idx; 248 249 // If Objective-C is enabled and this is a typename (class message 250 // send) or send to 'super', parse this as a message send 251 // expression. We handle C++ and C separately, since C++ requires 252 // much more complicated parsing. 253 if (getLangOpts().ObjC && getLangOpts().CPlusPlus) { 254 // Send to 'super'. 255 if (Tok.is(tok::identifier) && Tok.getIdentifierInfo() == Ident_super && 256 NextToken().isNot(tok::period) && 257 getCurScope()->isInObjcMethodScope()) { 258 CheckArrayDesignatorSyntax(*this, StartLoc, Desig); 259 return ParseAssignmentExprWithObjCMessageExprStart( 260 StartLoc, ConsumeToken(), nullptr, nullptr); 261 } 262 263 // Parse the receiver, which is either a type or an expression. 264 bool IsExpr; 265 void *TypeOrExpr; 266 if (ParseObjCXXMessageReceiver(IsExpr, TypeOrExpr)) { 267 SkipUntil(tok::r_square, StopAtSemi); 268 return ExprError(); 269 } 270 271 // If the receiver was a type, we have a class message; parse 272 // the rest of it. 273 if (!IsExpr) { 274 CheckArrayDesignatorSyntax(*this, StartLoc, Desig); 275 return ParseAssignmentExprWithObjCMessageExprStart(StartLoc, 276 SourceLocation(), 277 ParsedType::getFromOpaquePtr(TypeOrExpr), 278 nullptr); 279 } 280 281 // If the receiver was an expression, we still don't know 282 // whether we have a message send or an array designator; just 283 // adopt the expression for further analysis below. 284 // FIXME: potentially-potentially evaluated expression above? 285 Idx = ExprResult(static_cast<Expr*>(TypeOrExpr)); 286 } else if (getLangOpts().ObjC && Tok.is(tok::identifier)) { 287 IdentifierInfo *II = Tok.getIdentifierInfo(); 288 SourceLocation IILoc = Tok.getLocation(); 289 ParsedType ReceiverType; 290 // Three cases. This is a message send to a type: [type foo] 291 // This is a message send to super: [super foo] 292 // This is a message sent to an expr: [super.bar foo] 293 switch (Actions.getObjCMessageKind( 294 getCurScope(), II, IILoc, II == Ident_super, 295 NextToken().is(tok::period), ReceiverType)) { 296 case Sema::ObjCSuperMessage: 297 CheckArrayDesignatorSyntax(*this, StartLoc, Desig); 298 return ParseAssignmentExprWithObjCMessageExprStart( 299 StartLoc, ConsumeToken(), nullptr, nullptr); 300 301 case Sema::ObjCClassMessage: 302 CheckArrayDesignatorSyntax(*this, StartLoc, Desig); 303 ConsumeToken(); // the identifier 304 if (!ReceiverType) { 305 SkipUntil(tok::r_square, StopAtSemi); 306 return ExprError(); 307 } 308 309 // Parse type arguments and protocol qualifiers. 310 if (Tok.is(tok::less)) { 311 SourceLocation NewEndLoc; 312 TypeResult NewReceiverType 313 = parseObjCTypeArgsAndProtocolQualifiers(IILoc, ReceiverType, 314 /*consumeLastToken=*/true, 315 NewEndLoc); 316 if (!NewReceiverType.isUsable()) { 317 SkipUntil(tok::r_square, StopAtSemi); 318 return ExprError(); 319 } 320 321 ReceiverType = NewReceiverType.get(); 322 } 323 324 return ParseAssignmentExprWithObjCMessageExprStart(StartLoc, 325 SourceLocation(), 326 ReceiverType, 327 nullptr); 328 329 case Sema::ObjCInstanceMessage: 330 // Fall through; we'll just parse the expression and 331 // (possibly) treat this like an Objective-C message send 332 // later. 333 break; 334 } 335 } 336 337 // Parse the index expression, if we haven't already gotten one 338 // above (which can only happen in Objective-C++). 339 // Note that we parse this as an assignment expression, not a constant 340 // expression (allowing *=, =, etc) to handle the objc case. Sema needs 341 // to validate that the expression is a constant. 342 // FIXME: We also need to tell Sema that we're in a 343 // potentially-potentially evaluated context. 344 if (!Idx.get()) { 345 Idx = ParseAssignmentExpression(); 346 if (Idx.isInvalid()) { 347 SkipUntil(tok::r_square, StopAtSemi); 348 return Idx; 349 } 350 } 351 352 // Given an expression, we could either have a designator (if the next 353 // tokens are '...' or ']' or an objc message send. If this is an objc 354 // message send, handle it now. An objc-message send is the start of 355 // an assignment-expression production. 356 if (getLangOpts().ObjC && Tok.isNot(tok::ellipsis) && 357 Tok.isNot(tok::r_square)) { 358 CheckArrayDesignatorSyntax(*this, Tok.getLocation(), Desig); 359 return ParseAssignmentExprWithObjCMessageExprStart( 360 StartLoc, SourceLocation(), nullptr, Idx.get()); 361 } 362 363 // If this is a normal array designator, remember it. 364 if (Tok.isNot(tok::ellipsis)) { 365 Desig.AddDesignator(Designator::CreateArrayDesignator(Idx.get(), 366 StartLoc)); 367 } else { 368 // Handle the gnu array range extension. 369 Diag(Tok, diag::ext_gnu_array_range); 370 SourceLocation EllipsisLoc = ConsumeToken(); 371 372 ExprResult RHS(ParseConstantExpression()); 373 if (RHS.isInvalid()) { 374 SkipUntil(tok::r_square, StopAtSemi); 375 return RHS; 376 } 377 Desig.AddDesignator(Designator::CreateArrayRangeDesignator( 378 Idx.get(), RHS.get(), StartLoc, EllipsisLoc)); 379 } 380 381 T.consumeClose(); 382 Desig.getDesignator(Desig.getNumDesignators() - 1).setRBracketLoc( 383 T.getCloseLocation()); 384 } 385 386 // Okay, we're done with the designator sequence. We know that there must be 387 // at least one designator, because the only case we can get into this method 388 // without a designator is when we have an objc message send. That case is 389 // handled and returned from above. 390 assert(!Desig.empty() && "Designator is empty?"); 391 392 // Handle a normal designator sequence end, which is an equal. 393 if (Tok.is(tok::equal)) { 394 SourceLocation EqualLoc = ConsumeToken(); 395 PreferredType.enterDesignatedInitializer( 396 Tok.getLocation(), DesignatorCompletion.PreferredBaseType, Desig); 397 return Actions.ActOnDesignatedInitializer(Desig, EqualLoc, false, 398 ParseInitializer()); 399 } 400 401 // Handle a C++20 braced designated initialization, which results in 402 // direct-list-initialization of the aggregate element. We allow this as an 403 // extension from C++11 onwards (when direct-list-initialization was added). 404 if (Tok.is(tok::l_brace) && getLangOpts().CPlusPlus11) { 405 PreferredType.enterDesignatedInitializer( 406 Tok.getLocation(), DesignatorCompletion.PreferredBaseType, Desig); 407 return Actions.ActOnDesignatedInitializer(Desig, SourceLocation(), false, 408 ParseBraceInitializer()); 409 } 410 411 // We read some number of designators and found something that isn't an = or 412 // an initializer. If we have exactly one array designator, this 413 // is the GNU 'designation: array-designator' extension. Otherwise, it is a 414 // parse error. 415 if (Desig.getNumDesignators() == 1 && 416 (Desig.getDesignator(0).isArrayDesignator() || 417 Desig.getDesignator(0).isArrayRangeDesignator())) { 418 Diag(Tok, diag::ext_gnu_missing_equal_designator) 419 << FixItHint::CreateInsertion(Tok.getLocation(), "= "); 420 return Actions.ActOnDesignatedInitializer(Desig, Tok.getLocation(), 421 true, ParseInitializer()); 422 } 423 424 Diag(Tok, diag::err_expected_equal_designator); 425 return ExprError(); 426 } 427 428 /// ParseBraceInitializer - Called when parsing an initializer that has a 429 /// leading open brace. 430 /// 431 /// initializer: [C99 6.7.8] 432 /// '{' initializer-list '}' 433 /// '{' initializer-list ',' '}' 434 /// [C23] '{' '}' 435 /// 436 /// initializer-list: 437 /// designation[opt] initializer ...[opt] 438 /// initializer-list ',' designation[opt] initializer ...[opt] 439 /// 440 ExprResult Parser::ParseBraceInitializer() { 441 InMessageExpressionRAIIObject InMessage(*this, false); 442 443 BalancedDelimiterTracker T(*this, tok::l_brace); 444 T.consumeOpen(); 445 SourceLocation LBraceLoc = T.getOpenLocation(); 446 447 /// InitExprs - This is the actual list of expressions contained in the 448 /// initializer. 449 ExprVector InitExprs; 450 451 if (Tok.is(tok::r_brace)) { 452 // Empty initializers are a C++ feature and a GNU extension to C before C23. 453 if (!getLangOpts().CPlusPlus) { 454 Diag(LBraceLoc, getLangOpts().C23 455 ? diag::warn_c23_compat_empty_initializer 456 : diag::ext_c_empty_initializer); 457 } 458 // Match the '}'. 459 return Actions.ActOnInitList(LBraceLoc, std::nullopt, ConsumeBrace()); 460 } 461 462 // Enter an appropriate expression evaluation context for an initializer list. 463 EnterExpressionEvaluationContext EnterContext( 464 Actions, EnterExpressionEvaluationContext::InitList); 465 466 bool InitExprsOk = true; 467 QualType LikelyType = PreferredType.get(T.getOpenLocation()); 468 DesignatorCompletionInfo DesignatorCompletion{InitExprs, LikelyType}; 469 bool CalledSignatureHelp = false; 470 auto RunSignatureHelp = [&] { 471 QualType PreferredType; 472 if (!LikelyType.isNull()) 473 PreferredType = Actions.ProduceConstructorSignatureHelp( 474 LikelyType->getCanonicalTypeInternal(), T.getOpenLocation(), 475 InitExprs, T.getOpenLocation(), /*Braced=*/true); 476 CalledSignatureHelp = true; 477 return PreferredType; 478 }; 479 480 while (true) { 481 PreferredType.enterFunctionArgument(Tok.getLocation(), RunSignatureHelp); 482 483 // Handle Microsoft __if_exists/if_not_exists if necessary. 484 if (getLangOpts().MicrosoftExt && (Tok.is(tok::kw___if_exists) || 485 Tok.is(tok::kw___if_not_exists))) { 486 if (ParseMicrosoftIfExistsBraceInitializer(InitExprs, InitExprsOk)) { 487 if (Tok.isNot(tok::comma)) break; 488 ConsumeToken(); 489 } 490 if (Tok.is(tok::r_brace)) break; 491 continue; 492 } 493 494 // Parse: designation[opt] initializer 495 496 // If we know that this cannot be a designation, just parse the nested 497 // initializer directly. 498 ExprResult SubElt; 499 if (MayBeDesignationStart()) 500 SubElt = ParseInitializerWithPotentialDesignator(DesignatorCompletion); 501 else 502 SubElt = ParseInitializer(); 503 504 if (Tok.is(tok::ellipsis)) 505 SubElt = Actions.ActOnPackExpansion(SubElt.get(), ConsumeToken()); 506 507 SubElt = Actions.CorrectDelayedTyposInExpr(SubElt.get()); 508 509 // If we couldn't parse the subelement, bail out. 510 if (SubElt.isUsable()) { 511 InitExprs.push_back(SubElt.get()); 512 } else { 513 InitExprsOk = false; 514 515 // We have two ways to try to recover from this error: if the code looks 516 // grammatically ok (i.e. we have a comma coming up) try to continue 517 // parsing the rest of the initializer. This allows us to emit 518 // diagnostics for later elements that we find. If we don't see a comma, 519 // assume there is a parse error, and just skip to recover. 520 // FIXME: This comment doesn't sound right. If there is a r_brace 521 // immediately, it can't be an error, since there is no other way of 522 // leaving this loop except through this if. 523 if (Tok.isNot(tok::comma)) { 524 SkipUntil(tok::r_brace, StopBeforeMatch); 525 break; 526 } 527 } 528 529 // If we don't have a comma continued list, we're done. 530 if (Tok.isNot(tok::comma)) break; 531 532 // TODO: save comma locations if some client cares. 533 ConsumeToken(); 534 535 // Handle trailing comma. 536 if (Tok.is(tok::r_brace)) break; 537 } 538 539 bool closed = !T.consumeClose(); 540 541 if (InitExprsOk && closed) 542 return Actions.ActOnInitList(LBraceLoc, InitExprs, 543 T.getCloseLocation()); 544 545 return ExprError(); // an error occurred. 546 } 547 548 549 // Return true if a comma (or closing brace) is necessary after the 550 // __if_exists/if_not_exists statement. 551 bool Parser::ParseMicrosoftIfExistsBraceInitializer(ExprVector &InitExprs, 552 bool &InitExprsOk) { 553 bool trailingComma = false; 554 IfExistsCondition Result; 555 if (ParseMicrosoftIfExistsCondition(Result)) 556 return false; 557 558 BalancedDelimiterTracker Braces(*this, tok::l_brace); 559 if (Braces.consumeOpen()) { 560 Diag(Tok, diag::err_expected) << tok::l_brace; 561 return false; 562 } 563 564 switch (Result.Behavior) { 565 case IEB_Parse: 566 // Parse the declarations below. 567 break; 568 569 case IEB_Dependent: 570 Diag(Result.KeywordLoc, diag::warn_microsoft_dependent_exists) 571 << Result.IsIfExists; 572 // Fall through to skip. 573 [[fallthrough]]; 574 575 case IEB_Skip: 576 Braces.skipToEnd(); 577 return false; 578 } 579 580 DesignatorCompletionInfo DesignatorCompletion{ 581 InitExprs, 582 PreferredType.get(Braces.getOpenLocation()), 583 }; 584 while (!isEofOrEom()) { 585 trailingComma = false; 586 // If we know that this cannot be a designation, just parse the nested 587 // initializer directly. 588 ExprResult SubElt; 589 if (MayBeDesignationStart()) 590 SubElt = ParseInitializerWithPotentialDesignator(DesignatorCompletion); 591 else 592 SubElt = ParseInitializer(); 593 594 if (Tok.is(tok::ellipsis)) 595 SubElt = Actions.ActOnPackExpansion(SubElt.get(), ConsumeToken()); 596 597 // If we couldn't parse the subelement, bail out. 598 if (!SubElt.isInvalid()) 599 InitExprs.push_back(SubElt.get()); 600 else 601 InitExprsOk = false; 602 603 if (Tok.is(tok::comma)) { 604 ConsumeToken(); 605 trailingComma = true; 606 } 607 608 if (Tok.is(tok::r_brace)) 609 break; 610 } 611 612 Braces.consumeClose(); 613 614 return !trailingComma; 615 } 616