1 //===--- ParseInit.cpp - Initializer Parsing ------------------------------===// 2 // 3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions. 4 // See https://llvm.org/LICENSE.txt for license information. 5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception 6 // 7 //===----------------------------------------------------------------------===// 8 // 9 // This file implements initializer parsing as specified by C99 6.7.8. 10 // 11 //===----------------------------------------------------------------------===// 12 13 #include "clang/Basic/TokenKinds.h" 14 #include "clang/Parse/ParseDiagnostic.h" 15 #include "clang/Parse/Parser.h" 16 #include "clang/Parse/RAIIObjectsForParser.h" 17 #include "clang/Sema/Designator.h" 18 #include "clang/Sema/Ownership.h" 19 #include "clang/Sema/Scope.h" 20 #include "llvm/ADT/STLExtras.h" 21 #include "llvm/ADT/SmallString.h" 22 using namespace clang; 23 24 25 /// MayBeDesignationStart - Return true if the current token might be the start 26 /// of a designator. If we can tell it is impossible that it is a designator, 27 /// return false. 28 bool Parser::MayBeDesignationStart() { 29 switch (Tok.getKind()) { 30 default: 31 return false; 32 33 case tok::period: // designator: '.' identifier 34 return true; 35 36 case tok::l_square: { // designator: array-designator 37 if (!PP.getLangOpts().CPlusPlus11) 38 return true; 39 40 // C++11 lambda expressions and C99 designators can be ambiguous all the 41 // way through the closing ']' and to the next character. Handle the easy 42 // cases here, and fall back to tentative parsing if those fail. 43 switch (PP.LookAhead(0).getKind()) { 44 case tok::equal: 45 case tok::ellipsis: 46 case tok::r_square: 47 // Definitely starts a lambda expression. 48 return false; 49 50 case tok::amp: 51 case tok::kw_this: 52 case tok::star: 53 case tok::identifier: 54 // We have to do additional analysis, because these could be the 55 // start of a constant expression or a lambda capture list. 56 break; 57 58 default: 59 // Anything not mentioned above cannot occur following a '[' in a 60 // lambda expression. 61 return true; 62 } 63 64 // Handle the complicated case below. 65 break; 66 } 67 case tok::identifier: // designation: identifier ':' 68 return PP.LookAhead(0).is(tok::colon); 69 } 70 71 // Parse up to (at most) the token after the closing ']' to determine 72 // whether this is a C99 designator or a lambda. 73 RevertingTentativeParsingAction Tentative(*this); 74 75 LambdaIntroducer Intro; 76 LambdaIntroducerTentativeParse ParseResult; 77 if (ParseLambdaIntroducer(Intro, &ParseResult)) { 78 // Hit and diagnosed an error in a lambda. 79 // FIXME: Tell the caller this happened so they can recover. 80 return true; 81 } 82 83 switch (ParseResult) { 84 case LambdaIntroducerTentativeParse::Success: 85 case LambdaIntroducerTentativeParse::Incomplete: 86 // Might be a lambda-expression. Keep looking. 87 // FIXME: If our tentative parse was not incomplete, parse the lambda from 88 // here rather than throwing away then reparsing the LambdaIntroducer. 89 break; 90 91 case LambdaIntroducerTentativeParse::MessageSend: 92 case LambdaIntroducerTentativeParse::Invalid: 93 // Can't be a lambda-expression. Treat it as a designator. 94 // FIXME: Should we disambiguate against a message-send? 95 return true; 96 } 97 98 // Once we hit the closing square bracket, we look at the next 99 // token. If it's an '=', this is a designator. Otherwise, it's a 100 // lambda expression. This decision favors lambdas over the older 101 // GNU designator syntax, which allows one to omit the '=', but is 102 // consistent with GCC. 103 return Tok.is(tok::equal); 104 } 105 106 static void CheckArrayDesignatorSyntax(Parser &P, SourceLocation Loc, 107 Designation &Desig) { 108 // If we have exactly one array designator, this used the GNU 109 // 'designation: array-designator' extension, otherwise there should be no 110 // designators at all! 111 if (Desig.getNumDesignators() == 1 && 112 (Desig.getDesignator(0).isArrayDesignator() || 113 Desig.getDesignator(0).isArrayRangeDesignator())) 114 P.Diag(Loc, diag::ext_gnu_missing_equal_designator); 115 else if (Desig.getNumDesignators() > 0) 116 P.Diag(Loc, diag::err_expected_equal_designator); 117 } 118 119 /// ParseInitializerWithPotentialDesignator - Parse the 'initializer' production 120 /// checking to see if the token stream starts with a designator. 121 /// 122 /// C99: 123 /// 124 /// designation: 125 /// designator-list '=' 126 /// [GNU] array-designator 127 /// [GNU] identifier ':' 128 /// 129 /// designator-list: 130 /// designator 131 /// designator-list designator 132 /// 133 /// designator: 134 /// array-designator 135 /// '.' identifier 136 /// 137 /// array-designator: 138 /// '[' constant-expression ']' 139 /// [GNU] '[' constant-expression '...' constant-expression ']' 140 /// 141 /// C++20: 142 /// 143 /// designated-initializer-list: 144 /// designated-initializer-clause 145 /// designated-initializer-list ',' designated-initializer-clause 146 /// 147 /// designated-initializer-clause: 148 /// designator brace-or-equal-initializer 149 /// 150 /// designator: 151 /// '.' identifier 152 /// 153 /// We allow the C99 syntax extensions in C++20, but do not allow the C++20 154 /// extension (a braced-init-list after the designator with no '=') in C99. 155 /// 156 /// NOTE: [OBC] allows '[ objc-receiver objc-message-args ]' as an 157 /// initializer (because it is an expression). We need to consider this case 158 /// when parsing array designators. 159 /// 160 /// \p CodeCompleteCB is called with Designation parsed so far. 161 ExprResult Parser::ParseInitializerWithPotentialDesignator( 162 DesignatorCompletionInfo DesignatorCompletion) { 163 // If this is the old-style GNU extension: 164 // designation ::= identifier ':' 165 // Handle it as a field designator. Otherwise, this must be the start of a 166 // normal expression. 167 if (Tok.is(tok::identifier)) { 168 const IdentifierInfo *FieldName = Tok.getIdentifierInfo(); 169 170 SmallString<256> NewSyntax; 171 llvm::raw_svector_ostream(NewSyntax) << '.' << FieldName->getName() 172 << " = "; 173 174 SourceLocation NameLoc = ConsumeToken(); // Eat the identifier. 175 176 assert(Tok.is(tok::colon) && "MayBeDesignationStart not working properly!"); 177 SourceLocation ColonLoc = ConsumeToken(); 178 179 Diag(NameLoc, diag::ext_gnu_old_style_field_designator) 180 << FixItHint::CreateReplacement(SourceRange(NameLoc, ColonLoc), 181 NewSyntax); 182 183 Designation D; 184 D.AddDesignator(Designator::getField(FieldName, SourceLocation(), NameLoc)); 185 PreferredType.enterDesignatedInitializer( 186 Tok.getLocation(), DesignatorCompletion.PreferredBaseType, D); 187 return Actions.ActOnDesignatedInitializer(D, ColonLoc, true, 188 ParseInitializer()); 189 } 190 191 // Desig - This is initialized when we see our first designator. We may have 192 // an objc message send with no designator, so we don't want to create this 193 // eagerly. 194 Designation Desig; 195 196 // Parse each designator in the designator list until we find an initializer. 197 while (Tok.is(tok::period) || Tok.is(tok::l_square)) { 198 if (Tok.is(tok::period)) { 199 // designator: '.' identifier 200 SourceLocation DotLoc = ConsumeToken(); 201 202 if (Tok.is(tok::code_completion)) { 203 cutOffParsing(); 204 Actions.CodeCompleteDesignator(DesignatorCompletion.PreferredBaseType, 205 DesignatorCompletion.InitExprs, Desig); 206 return ExprError(); 207 } 208 if (Tok.isNot(tok::identifier)) { 209 Diag(Tok.getLocation(), diag::err_expected_field_designator); 210 return ExprError(); 211 } 212 213 Desig.AddDesignator(Designator::getField(Tok.getIdentifierInfo(), DotLoc, 214 Tok.getLocation())); 215 ConsumeToken(); // Eat the identifier. 216 continue; 217 } 218 219 // We must have either an array designator now or an objc message send. 220 assert(Tok.is(tok::l_square) && "Unexpected token!"); 221 222 // Handle the two forms of array designator: 223 // array-designator: '[' constant-expression ']' 224 // array-designator: '[' constant-expression '...' constant-expression ']' 225 // 226 // Also, we have to handle the case where the expression after the 227 // designator an an objc message send: '[' objc-message-expr ']'. 228 // Interesting cases are: 229 // [foo bar] -> objc message send 230 // [foo] -> array designator 231 // [foo ... bar] -> array designator 232 // [4][foo bar] -> obsolete GNU designation with objc message send. 233 // 234 // We do not need to check for an expression starting with [[ here. If it 235 // contains an Objective-C message send, then it is not an ill-formed 236 // attribute. If it is a lambda-expression within an array-designator, then 237 // it will be rejected because a constant-expression cannot begin with a 238 // lambda-expression. 239 InMessageExpressionRAIIObject InMessage(*this, true); 240 241 BalancedDelimiterTracker T(*this, tok::l_square); 242 T.consumeOpen(); 243 SourceLocation StartLoc = T.getOpenLocation(); 244 245 ExprResult Idx; 246 247 // If Objective-C is enabled and this is a typename (class message 248 // send) or send to 'super', parse this as a message send 249 // expression. We handle C++ and C separately, since C++ requires 250 // much more complicated parsing. 251 if (getLangOpts().ObjC && getLangOpts().CPlusPlus) { 252 // Send to 'super'. 253 if (Tok.is(tok::identifier) && Tok.getIdentifierInfo() == Ident_super && 254 NextToken().isNot(tok::period) && 255 getCurScope()->isInObjcMethodScope()) { 256 CheckArrayDesignatorSyntax(*this, StartLoc, Desig); 257 return ParseAssignmentExprWithObjCMessageExprStart( 258 StartLoc, ConsumeToken(), nullptr, nullptr); 259 } 260 261 // Parse the receiver, which is either a type or an expression. 262 bool IsExpr; 263 void *TypeOrExpr; 264 if (ParseObjCXXMessageReceiver(IsExpr, TypeOrExpr)) { 265 SkipUntil(tok::r_square, StopAtSemi); 266 return ExprError(); 267 } 268 269 // If the receiver was a type, we have a class message; parse 270 // the rest of it. 271 if (!IsExpr) { 272 CheckArrayDesignatorSyntax(*this, StartLoc, Desig); 273 return ParseAssignmentExprWithObjCMessageExprStart(StartLoc, 274 SourceLocation(), 275 ParsedType::getFromOpaquePtr(TypeOrExpr), 276 nullptr); 277 } 278 279 // If the receiver was an expression, we still don't know 280 // whether we have a message send or an array designator; just 281 // adopt the expression for further analysis below. 282 // FIXME: potentially-potentially evaluated expression above? 283 Idx = ExprResult(static_cast<Expr*>(TypeOrExpr)); 284 } else if (getLangOpts().ObjC && Tok.is(tok::identifier)) { 285 IdentifierInfo *II = Tok.getIdentifierInfo(); 286 SourceLocation IILoc = Tok.getLocation(); 287 ParsedType ReceiverType; 288 // Three cases. This is a message send to a type: [type foo] 289 // This is a message send to super: [super foo] 290 // This is a message sent to an expr: [super.bar foo] 291 switch (Actions.getObjCMessageKind( 292 getCurScope(), II, IILoc, II == Ident_super, 293 NextToken().is(tok::period), ReceiverType)) { 294 case Sema::ObjCSuperMessage: 295 CheckArrayDesignatorSyntax(*this, StartLoc, Desig); 296 return ParseAssignmentExprWithObjCMessageExprStart( 297 StartLoc, ConsumeToken(), nullptr, nullptr); 298 299 case Sema::ObjCClassMessage: 300 CheckArrayDesignatorSyntax(*this, StartLoc, Desig); 301 ConsumeToken(); // the identifier 302 if (!ReceiverType) { 303 SkipUntil(tok::r_square, StopAtSemi); 304 return ExprError(); 305 } 306 307 // Parse type arguments and protocol qualifiers. 308 if (Tok.is(tok::less)) { 309 SourceLocation NewEndLoc; 310 TypeResult NewReceiverType 311 = parseObjCTypeArgsAndProtocolQualifiers(IILoc, ReceiverType, 312 /*consumeLastToken=*/true, 313 NewEndLoc); 314 if (!NewReceiverType.isUsable()) { 315 SkipUntil(tok::r_square, StopAtSemi); 316 return ExprError(); 317 } 318 319 ReceiverType = NewReceiverType.get(); 320 } 321 322 return ParseAssignmentExprWithObjCMessageExprStart(StartLoc, 323 SourceLocation(), 324 ReceiverType, 325 nullptr); 326 327 case Sema::ObjCInstanceMessage: 328 // Fall through; we'll just parse the expression and 329 // (possibly) treat this like an Objective-C message send 330 // later. 331 break; 332 } 333 } 334 335 // Parse the index expression, if we haven't already gotten one 336 // above (which can only happen in Objective-C++). 337 // Note that we parse this as an assignment expression, not a constant 338 // expression (allowing *=, =, etc) to handle the objc case. Sema needs 339 // to validate that the expression is a constant. 340 // FIXME: We also need to tell Sema that we're in a 341 // potentially-potentially evaluated context. 342 if (!Idx.get()) { 343 Idx = ParseAssignmentExpression(); 344 if (Idx.isInvalid()) { 345 SkipUntil(tok::r_square, StopAtSemi); 346 return Idx; 347 } 348 } 349 350 // Given an expression, we could either have a designator (if the next 351 // tokens are '...' or ']' or an objc message send. If this is an objc 352 // message send, handle it now. An objc-message send is the start of 353 // an assignment-expression production. 354 if (getLangOpts().ObjC && Tok.isNot(tok::ellipsis) && 355 Tok.isNot(tok::r_square)) { 356 CheckArrayDesignatorSyntax(*this, Tok.getLocation(), Desig); 357 return ParseAssignmentExprWithObjCMessageExprStart( 358 StartLoc, SourceLocation(), nullptr, Idx.get()); 359 } 360 361 // If this is a normal array designator, remember it. 362 if (Tok.isNot(tok::ellipsis)) { 363 Desig.AddDesignator(Designator::getArray(Idx.get(), StartLoc)); 364 } else { 365 // Handle the gnu array range extension. 366 Diag(Tok, diag::ext_gnu_array_range); 367 SourceLocation EllipsisLoc = ConsumeToken(); 368 369 ExprResult RHS(ParseConstantExpression()); 370 if (RHS.isInvalid()) { 371 SkipUntil(tok::r_square, StopAtSemi); 372 return RHS; 373 } 374 Desig.AddDesignator(Designator::getArrayRange(Idx.get(), 375 RHS.get(), 376 StartLoc, EllipsisLoc)); 377 } 378 379 T.consumeClose(); 380 Desig.getDesignator(Desig.getNumDesignators() - 1).setRBracketLoc( 381 T.getCloseLocation()); 382 } 383 384 // Okay, we're done with the designator sequence. We know that there must be 385 // at least one designator, because the only case we can get into this method 386 // without a designator is when we have an objc message send. That case is 387 // handled and returned from above. 388 assert(!Desig.empty() && "Designator is empty?"); 389 390 // Handle a normal designator sequence end, which is an equal. 391 if (Tok.is(tok::equal)) { 392 SourceLocation EqualLoc = ConsumeToken(); 393 PreferredType.enterDesignatedInitializer( 394 Tok.getLocation(), DesignatorCompletion.PreferredBaseType, Desig); 395 return Actions.ActOnDesignatedInitializer(Desig, EqualLoc, false, 396 ParseInitializer()); 397 } 398 399 // Handle a C++20 braced designated initialization, which results in 400 // direct-list-initialization of the aggregate element. We allow this as an 401 // extension from C++11 onwards (when direct-list-initialization was added). 402 if (Tok.is(tok::l_brace) && getLangOpts().CPlusPlus11) { 403 PreferredType.enterDesignatedInitializer( 404 Tok.getLocation(), DesignatorCompletion.PreferredBaseType, Desig); 405 return Actions.ActOnDesignatedInitializer(Desig, SourceLocation(), false, 406 ParseBraceInitializer()); 407 } 408 409 // We read some number of designators and found something that isn't an = or 410 // an initializer. If we have exactly one array designator, this 411 // is the GNU 'designation: array-designator' extension. Otherwise, it is a 412 // parse error. 413 if (Desig.getNumDesignators() == 1 && 414 (Desig.getDesignator(0).isArrayDesignator() || 415 Desig.getDesignator(0).isArrayRangeDesignator())) { 416 Diag(Tok, diag::ext_gnu_missing_equal_designator) 417 << FixItHint::CreateInsertion(Tok.getLocation(), "= "); 418 return Actions.ActOnDesignatedInitializer(Desig, Tok.getLocation(), 419 true, ParseInitializer()); 420 } 421 422 Diag(Tok, diag::err_expected_equal_designator); 423 return ExprError(); 424 } 425 426 /// ParseBraceInitializer - Called when parsing an initializer that has a 427 /// leading open brace. 428 /// 429 /// initializer: [C99 6.7.8] 430 /// '{' initializer-list '}' 431 /// '{' initializer-list ',' '}' 432 /// [GNU] '{' '}' 433 /// 434 /// initializer-list: 435 /// designation[opt] initializer ...[opt] 436 /// initializer-list ',' designation[opt] initializer ...[opt] 437 /// 438 ExprResult Parser::ParseBraceInitializer() { 439 InMessageExpressionRAIIObject InMessage(*this, false); 440 441 BalancedDelimiterTracker T(*this, tok::l_brace); 442 T.consumeOpen(); 443 SourceLocation LBraceLoc = T.getOpenLocation(); 444 445 /// InitExprs - This is the actual list of expressions contained in the 446 /// initializer. 447 ExprVector InitExprs; 448 449 if (Tok.is(tok::r_brace)) { 450 // Empty initializers are a C++ feature and a GNU extension to C. 451 if (!getLangOpts().CPlusPlus) 452 Diag(LBraceLoc, diag::ext_gnu_empty_initializer); 453 // Match the '}'. 454 return Actions.ActOnInitList(LBraceLoc, None, ConsumeBrace()); 455 } 456 457 // Enter an appropriate expression evaluation context for an initializer list. 458 EnterExpressionEvaluationContext EnterContext( 459 Actions, EnterExpressionEvaluationContext::InitList); 460 461 bool InitExprsOk = true; 462 DesignatorCompletionInfo DesignatorCompletion{ 463 InitExprs, 464 PreferredType.get(T.getOpenLocation()), 465 }; 466 467 while (1) { 468 // Handle Microsoft __if_exists/if_not_exists if necessary. 469 if (getLangOpts().MicrosoftExt && (Tok.is(tok::kw___if_exists) || 470 Tok.is(tok::kw___if_not_exists))) { 471 if (ParseMicrosoftIfExistsBraceInitializer(InitExprs, InitExprsOk)) { 472 if (Tok.isNot(tok::comma)) break; 473 ConsumeToken(); 474 } 475 if (Tok.is(tok::r_brace)) break; 476 continue; 477 } 478 479 // Parse: designation[opt] initializer 480 481 // If we know that this cannot be a designation, just parse the nested 482 // initializer directly. 483 ExprResult SubElt; 484 if (MayBeDesignationStart()) 485 SubElt = ParseInitializerWithPotentialDesignator(DesignatorCompletion); 486 else 487 SubElt = ParseInitializer(); 488 489 if (Tok.is(tok::ellipsis)) 490 SubElt = Actions.ActOnPackExpansion(SubElt.get(), ConsumeToken()); 491 492 SubElt = Actions.CorrectDelayedTyposInExpr(SubElt.get()); 493 494 // If we couldn't parse the subelement, bail out. 495 if (SubElt.isUsable()) { 496 InitExprs.push_back(SubElt.get()); 497 } else { 498 InitExprsOk = false; 499 500 // We have two ways to try to recover from this error: if the code looks 501 // grammatically ok (i.e. we have a comma coming up) try to continue 502 // parsing the rest of the initializer. This allows us to emit 503 // diagnostics for later elements that we find. If we don't see a comma, 504 // assume there is a parse error, and just skip to recover. 505 // FIXME: This comment doesn't sound right. If there is a r_brace 506 // immediately, it can't be an error, since there is no other way of 507 // leaving this loop except through this if. 508 if (Tok.isNot(tok::comma)) { 509 SkipUntil(tok::r_brace, StopBeforeMatch); 510 break; 511 } 512 } 513 514 // If we don't have a comma continued list, we're done. 515 if (Tok.isNot(tok::comma)) break; 516 517 // TODO: save comma locations if some client cares. 518 ConsumeToken(); 519 520 // Handle trailing comma. 521 if (Tok.is(tok::r_brace)) break; 522 } 523 524 bool closed = !T.consumeClose(); 525 526 if (InitExprsOk && closed) 527 return Actions.ActOnInitList(LBraceLoc, InitExprs, 528 T.getCloseLocation()); 529 530 return ExprError(); // an error occurred. 531 } 532 533 534 // Return true if a comma (or closing brace) is necessary after the 535 // __if_exists/if_not_exists statement. 536 bool Parser::ParseMicrosoftIfExistsBraceInitializer(ExprVector &InitExprs, 537 bool &InitExprsOk) { 538 bool trailingComma = false; 539 IfExistsCondition Result; 540 if (ParseMicrosoftIfExistsCondition(Result)) 541 return false; 542 543 BalancedDelimiterTracker Braces(*this, tok::l_brace); 544 if (Braces.consumeOpen()) { 545 Diag(Tok, diag::err_expected) << tok::l_brace; 546 return false; 547 } 548 549 switch (Result.Behavior) { 550 case IEB_Parse: 551 // Parse the declarations below. 552 break; 553 554 case IEB_Dependent: 555 Diag(Result.KeywordLoc, diag::warn_microsoft_dependent_exists) 556 << Result.IsIfExists; 557 // Fall through to skip. 558 LLVM_FALLTHROUGH; 559 560 case IEB_Skip: 561 Braces.skipToEnd(); 562 return false; 563 } 564 565 DesignatorCompletionInfo DesignatorCompletion{ 566 InitExprs, 567 PreferredType.get(Braces.getOpenLocation()), 568 }; 569 while (!isEofOrEom()) { 570 trailingComma = false; 571 // If we know that this cannot be a designation, just parse the nested 572 // initializer directly. 573 ExprResult SubElt; 574 if (MayBeDesignationStart()) 575 SubElt = ParseInitializerWithPotentialDesignator(DesignatorCompletion); 576 else 577 SubElt = ParseInitializer(); 578 579 if (Tok.is(tok::ellipsis)) 580 SubElt = Actions.ActOnPackExpansion(SubElt.get(), ConsumeToken()); 581 582 // If we couldn't parse the subelement, bail out. 583 if (!SubElt.isInvalid()) 584 InitExprs.push_back(SubElt.get()); 585 else 586 InitExprsOk = false; 587 588 if (Tok.is(tok::comma)) { 589 ConsumeToken(); 590 trailingComma = true; 591 } 592 593 if (Tok.is(tok::r_brace)) 594 break; 595 } 596 597 Braces.consumeClose(); 598 599 return !trailingComma; 600 } 601