xref: /freebsd/contrib/llvm-project/clang/lib/Parse/ParseInit.cpp (revision 833a452e9f082a7982a31c21f0da437dbbe0a39d)
1 //===--- ParseInit.cpp - Initializer Parsing ------------------------------===//
2 //
3 // Part of the LLVM Project, under the Apache License v2.0 with LLVM Exceptions.
4 // See https://llvm.org/LICENSE.txt for license information.
5 // SPDX-License-Identifier: Apache-2.0 WITH LLVM-exception
6 //
7 //===----------------------------------------------------------------------===//
8 //
9 // This file implements initializer parsing as specified by C99 6.7.8.
10 //
11 //===----------------------------------------------------------------------===//
12 
13 #include "clang/Basic/TokenKinds.h"
14 #include "clang/Parse/ParseDiagnostic.h"
15 #include "clang/Parse/Parser.h"
16 #include "clang/Parse/RAIIObjectsForParser.h"
17 #include "clang/Sema/Designator.h"
18 #include "clang/Sema/Ownership.h"
19 #include "clang/Sema/Scope.h"
20 #include "llvm/ADT/STLExtras.h"
21 #include "llvm/ADT/SmallString.h"
22 using namespace clang;
23 
24 
25 /// MayBeDesignationStart - Return true if the current token might be the start
26 /// of a designator.  If we can tell it is impossible that it is a designator,
27 /// return false.
28 bool Parser::MayBeDesignationStart() {
29   switch (Tok.getKind()) {
30   default:
31     return false;
32 
33   case tok::period:      // designator: '.' identifier
34     return true;
35 
36   case tok::l_square: {  // designator: array-designator
37     if (!PP.getLangOpts().CPlusPlus11)
38       return true;
39 
40     // C++11 lambda expressions and C99 designators can be ambiguous all the
41     // way through the closing ']' and to the next character. Handle the easy
42     // cases here, and fall back to tentative parsing if those fail.
43     switch (PP.LookAhead(0).getKind()) {
44     case tok::equal:
45     case tok::ellipsis:
46     case tok::r_square:
47       // Definitely starts a lambda expression.
48       return false;
49 
50     case tok::amp:
51     case tok::kw_this:
52     case tok::star:
53     case tok::identifier:
54       // We have to do additional analysis, because these could be the
55       // start of a constant expression or a lambda capture list.
56       break;
57 
58     default:
59       // Anything not mentioned above cannot occur following a '[' in a
60       // lambda expression.
61       return true;
62     }
63 
64     // Handle the complicated case below.
65     break;
66   }
67   case tok::identifier:  // designation: identifier ':'
68     return PP.LookAhead(0).is(tok::colon);
69   }
70 
71   // Parse up to (at most) the token after the closing ']' to determine
72   // whether this is a C99 designator or a lambda.
73   RevertingTentativeParsingAction Tentative(*this);
74 
75   LambdaIntroducer Intro;
76   LambdaIntroducerTentativeParse ParseResult;
77   if (ParseLambdaIntroducer(Intro, &ParseResult)) {
78     // Hit and diagnosed an error in a lambda.
79     // FIXME: Tell the caller this happened so they can recover.
80     return true;
81   }
82 
83   switch (ParseResult) {
84   case LambdaIntroducerTentativeParse::Success:
85   case LambdaIntroducerTentativeParse::Incomplete:
86     // Might be a lambda-expression. Keep looking.
87     // FIXME: If our tentative parse was not incomplete, parse the lambda from
88     // here rather than throwing away then reparsing the LambdaIntroducer.
89     break;
90 
91   case LambdaIntroducerTentativeParse::MessageSend:
92   case LambdaIntroducerTentativeParse::Invalid:
93     // Can't be a lambda-expression. Treat it as a designator.
94     // FIXME: Should we disambiguate against a message-send?
95     return true;
96   }
97 
98   // Once we hit the closing square bracket, we look at the next
99   // token. If it's an '=', this is a designator. Otherwise, it's a
100   // lambda expression. This decision favors lambdas over the older
101   // GNU designator syntax, which allows one to omit the '=', but is
102   // consistent with GCC.
103   return Tok.is(tok::equal);
104 }
105 
106 static void CheckArrayDesignatorSyntax(Parser &P, SourceLocation Loc,
107                                        Designation &Desig) {
108   // If we have exactly one array designator, this used the GNU
109   // 'designation: array-designator' extension, otherwise there should be no
110   // designators at all!
111   if (Desig.getNumDesignators() == 1 &&
112       (Desig.getDesignator(0).isArrayDesignator() ||
113        Desig.getDesignator(0).isArrayRangeDesignator()))
114     P.Diag(Loc, diag::ext_gnu_missing_equal_designator);
115   else if (Desig.getNumDesignators() > 0)
116     P.Diag(Loc, diag::err_expected_equal_designator);
117 }
118 
119 /// ParseInitializerWithPotentialDesignator - Parse the 'initializer' production
120 /// checking to see if the token stream starts with a designator.
121 ///
122 /// C99:
123 ///
124 ///       designation:
125 ///         designator-list '='
126 /// [GNU]   array-designator
127 /// [GNU]   identifier ':'
128 ///
129 ///       designator-list:
130 ///         designator
131 ///         designator-list designator
132 ///
133 ///       designator:
134 ///         array-designator
135 ///         '.' identifier
136 ///
137 ///       array-designator:
138 ///         '[' constant-expression ']'
139 /// [GNU]   '[' constant-expression '...' constant-expression ']'
140 ///
141 /// C++20:
142 ///
143 ///       designated-initializer-list:
144 ///         designated-initializer-clause
145 ///         designated-initializer-list ',' designated-initializer-clause
146 ///
147 ///       designated-initializer-clause:
148 ///         designator brace-or-equal-initializer
149 ///
150 ///       designator:
151 ///         '.' identifier
152 ///
153 /// We allow the C99 syntax extensions in C++20, but do not allow the C++20
154 /// extension (a braced-init-list after the designator with no '=') in C99.
155 ///
156 /// NOTE: [OBC] allows '[ objc-receiver objc-message-args ]' as an
157 /// initializer (because it is an expression).  We need to consider this case
158 /// when parsing array designators.
159 ///
160 /// \p CodeCompleteCB is called with Designation parsed so far.
161 ExprResult Parser::ParseInitializerWithPotentialDesignator(
162     DesignatorCompletionInfo DesignatorCompletion) {
163   // If this is the old-style GNU extension:
164   //   designation ::= identifier ':'
165   // Handle it as a field designator.  Otherwise, this must be the start of a
166   // normal expression.
167   if (Tok.is(tok::identifier)) {
168     const IdentifierInfo *FieldName = Tok.getIdentifierInfo();
169 
170     SmallString<256> NewSyntax;
171     llvm::raw_svector_ostream(NewSyntax) << '.' << FieldName->getName()
172                                          << " = ";
173 
174     SourceLocation NameLoc = ConsumeToken(); // Eat the identifier.
175 
176     assert(Tok.is(tok::colon) && "MayBeDesignationStart not working properly!");
177     SourceLocation ColonLoc = ConsumeToken();
178 
179     Diag(NameLoc, diag::ext_gnu_old_style_field_designator)
180       << FixItHint::CreateReplacement(SourceRange(NameLoc, ColonLoc),
181                                       NewSyntax);
182 
183     Designation D;
184     D.AddDesignator(Designator::getField(FieldName, SourceLocation(), NameLoc));
185     PreferredType.enterDesignatedInitializer(
186         Tok.getLocation(), DesignatorCompletion.PreferredBaseType, D);
187     return Actions.ActOnDesignatedInitializer(D, ColonLoc, true,
188                                               ParseInitializer());
189   }
190 
191   // Desig - This is initialized when we see our first designator.  We may have
192   // an objc message send with no designator, so we don't want to create this
193   // eagerly.
194   Designation Desig;
195 
196   // Parse each designator in the designator list until we find an initializer.
197   while (Tok.is(tok::period) || Tok.is(tok::l_square)) {
198     if (Tok.is(tok::period)) {
199       // designator: '.' identifier
200       SourceLocation DotLoc = ConsumeToken();
201 
202       if (Tok.is(tok::code_completion)) {
203         cutOffParsing();
204         Actions.CodeCompleteDesignator(DesignatorCompletion.PreferredBaseType,
205                                        DesignatorCompletion.InitExprs, Desig);
206         return ExprError();
207       }
208       if (Tok.isNot(tok::identifier)) {
209         Diag(Tok.getLocation(), diag::err_expected_field_designator);
210         return ExprError();
211       }
212 
213       Desig.AddDesignator(Designator::getField(Tok.getIdentifierInfo(), DotLoc,
214                                                Tok.getLocation()));
215       ConsumeToken(); // Eat the identifier.
216       continue;
217     }
218 
219     // We must have either an array designator now or an objc message send.
220     assert(Tok.is(tok::l_square) && "Unexpected token!");
221 
222     // Handle the two forms of array designator:
223     //   array-designator: '[' constant-expression ']'
224     //   array-designator: '[' constant-expression '...' constant-expression ']'
225     //
226     // Also, we have to handle the case where the expression after the
227     // designator an an objc message send: '[' objc-message-expr ']'.
228     // Interesting cases are:
229     //   [foo bar]         -> objc message send
230     //   [foo]             -> array designator
231     //   [foo ... bar]     -> array designator
232     //   [4][foo bar]      -> obsolete GNU designation with objc message send.
233     //
234     // We do not need to check for an expression starting with [[ here. If it
235     // contains an Objective-C message send, then it is not an ill-formed
236     // attribute. If it is a lambda-expression within an array-designator, then
237     // it will be rejected because a constant-expression cannot begin with a
238     // lambda-expression.
239     InMessageExpressionRAIIObject InMessage(*this, true);
240 
241     BalancedDelimiterTracker T(*this, tok::l_square);
242     T.consumeOpen();
243     SourceLocation StartLoc = T.getOpenLocation();
244 
245     ExprResult Idx;
246 
247     // If Objective-C is enabled and this is a typename (class message
248     // send) or send to 'super', parse this as a message send
249     // expression.  We handle C++ and C separately, since C++ requires
250     // much more complicated parsing.
251     if  (getLangOpts().ObjC && getLangOpts().CPlusPlus) {
252       // Send to 'super'.
253       if (Tok.is(tok::identifier) && Tok.getIdentifierInfo() == Ident_super &&
254           NextToken().isNot(tok::period) &&
255           getCurScope()->isInObjcMethodScope()) {
256         CheckArrayDesignatorSyntax(*this, StartLoc, Desig);
257         return ParseAssignmentExprWithObjCMessageExprStart(
258             StartLoc, ConsumeToken(), nullptr, nullptr);
259       }
260 
261       // Parse the receiver, which is either a type or an expression.
262       bool IsExpr;
263       void *TypeOrExpr;
264       if (ParseObjCXXMessageReceiver(IsExpr, TypeOrExpr)) {
265         SkipUntil(tok::r_square, StopAtSemi);
266         return ExprError();
267       }
268 
269       // If the receiver was a type, we have a class message; parse
270       // the rest of it.
271       if (!IsExpr) {
272         CheckArrayDesignatorSyntax(*this, StartLoc, Desig);
273         return ParseAssignmentExprWithObjCMessageExprStart(StartLoc,
274                                                            SourceLocation(),
275                                    ParsedType::getFromOpaquePtr(TypeOrExpr),
276                                                            nullptr);
277       }
278 
279       // If the receiver was an expression, we still don't know
280       // whether we have a message send or an array designator; just
281       // adopt the expression for further analysis below.
282       // FIXME: potentially-potentially evaluated expression above?
283       Idx = ExprResult(static_cast<Expr*>(TypeOrExpr));
284     } else if (getLangOpts().ObjC && Tok.is(tok::identifier)) {
285       IdentifierInfo *II = Tok.getIdentifierInfo();
286       SourceLocation IILoc = Tok.getLocation();
287       ParsedType ReceiverType;
288       // Three cases. This is a message send to a type: [type foo]
289       // This is a message send to super:  [super foo]
290       // This is a message sent to an expr:  [super.bar foo]
291       switch (Actions.getObjCMessageKind(
292           getCurScope(), II, IILoc, II == Ident_super,
293           NextToken().is(tok::period), ReceiverType)) {
294       case Sema::ObjCSuperMessage:
295         CheckArrayDesignatorSyntax(*this, StartLoc, Desig);
296         return ParseAssignmentExprWithObjCMessageExprStart(
297             StartLoc, ConsumeToken(), nullptr, nullptr);
298 
299       case Sema::ObjCClassMessage:
300         CheckArrayDesignatorSyntax(*this, StartLoc, Desig);
301         ConsumeToken(); // the identifier
302         if (!ReceiverType) {
303           SkipUntil(tok::r_square, StopAtSemi);
304           return ExprError();
305         }
306 
307         // Parse type arguments and protocol qualifiers.
308         if (Tok.is(tok::less)) {
309           SourceLocation NewEndLoc;
310           TypeResult NewReceiverType
311             = parseObjCTypeArgsAndProtocolQualifiers(IILoc, ReceiverType,
312                                                      /*consumeLastToken=*/true,
313                                                      NewEndLoc);
314           if (!NewReceiverType.isUsable()) {
315             SkipUntil(tok::r_square, StopAtSemi);
316             return ExprError();
317           }
318 
319           ReceiverType = NewReceiverType.get();
320         }
321 
322         return ParseAssignmentExprWithObjCMessageExprStart(StartLoc,
323                                                            SourceLocation(),
324                                                            ReceiverType,
325                                                            nullptr);
326 
327       case Sema::ObjCInstanceMessage:
328         // Fall through; we'll just parse the expression and
329         // (possibly) treat this like an Objective-C message send
330         // later.
331         break;
332       }
333     }
334 
335     // Parse the index expression, if we haven't already gotten one
336     // above (which can only happen in Objective-C++).
337     // Note that we parse this as an assignment expression, not a constant
338     // expression (allowing *=, =, etc) to handle the objc case.  Sema needs
339     // to validate that the expression is a constant.
340     // FIXME: We also need to tell Sema that we're in a
341     // potentially-potentially evaluated context.
342     if (!Idx.get()) {
343       Idx = ParseAssignmentExpression();
344       if (Idx.isInvalid()) {
345         SkipUntil(tok::r_square, StopAtSemi);
346         return Idx;
347       }
348     }
349 
350     // Given an expression, we could either have a designator (if the next
351     // tokens are '...' or ']' or an objc message send.  If this is an objc
352     // message send, handle it now.  An objc-message send is the start of
353     // an assignment-expression production.
354     if (getLangOpts().ObjC && Tok.isNot(tok::ellipsis) &&
355         Tok.isNot(tok::r_square)) {
356       CheckArrayDesignatorSyntax(*this, Tok.getLocation(), Desig);
357       return ParseAssignmentExprWithObjCMessageExprStart(
358           StartLoc, SourceLocation(), nullptr, Idx.get());
359     }
360 
361     // If this is a normal array designator, remember it.
362     if (Tok.isNot(tok::ellipsis)) {
363       Desig.AddDesignator(Designator::getArray(Idx.get(), StartLoc));
364     } else {
365       // Handle the gnu array range extension.
366       Diag(Tok, diag::ext_gnu_array_range);
367       SourceLocation EllipsisLoc = ConsumeToken();
368 
369       ExprResult RHS(ParseConstantExpression());
370       if (RHS.isInvalid()) {
371         SkipUntil(tok::r_square, StopAtSemi);
372         return RHS;
373       }
374       Desig.AddDesignator(Designator::getArrayRange(Idx.get(),
375                                                     RHS.get(),
376                                                     StartLoc, EllipsisLoc));
377     }
378 
379     T.consumeClose();
380     Desig.getDesignator(Desig.getNumDesignators() - 1).setRBracketLoc(
381                                                         T.getCloseLocation());
382   }
383 
384   // Okay, we're done with the designator sequence.  We know that there must be
385   // at least one designator, because the only case we can get into this method
386   // without a designator is when we have an objc message send.  That case is
387   // handled and returned from above.
388   assert(!Desig.empty() && "Designator is empty?");
389 
390   // Handle a normal designator sequence end, which is an equal.
391   if (Tok.is(tok::equal)) {
392     SourceLocation EqualLoc = ConsumeToken();
393     PreferredType.enterDesignatedInitializer(
394         Tok.getLocation(), DesignatorCompletion.PreferredBaseType, Desig);
395     return Actions.ActOnDesignatedInitializer(Desig, EqualLoc, false,
396                                               ParseInitializer());
397   }
398 
399   // Handle a C++20 braced designated initialization, which results in
400   // direct-list-initialization of the aggregate element. We allow this as an
401   // extension from C++11 onwards (when direct-list-initialization was added).
402   if (Tok.is(tok::l_brace) && getLangOpts().CPlusPlus11) {
403     PreferredType.enterDesignatedInitializer(
404         Tok.getLocation(), DesignatorCompletion.PreferredBaseType, Desig);
405     return Actions.ActOnDesignatedInitializer(Desig, SourceLocation(), false,
406                                               ParseBraceInitializer());
407   }
408 
409   // We read some number of designators and found something that isn't an = or
410   // an initializer.  If we have exactly one array designator, this
411   // is the GNU 'designation: array-designator' extension.  Otherwise, it is a
412   // parse error.
413   if (Desig.getNumDesignators() == 1 &&
414       (Desig.getDesignator(0).isArrayDesignator() ||
415        Desig.getDesignator(0).isArrayRangeDesignator())) {
416     Diag(Tok, diag::ext_gnu_missing_equal_designator)
417       << FixItHint::CreateInsertion(Tok.getLocation(), "= ");
418     return Actions.ActOnDesignatedInitializer(Desig, Tok.getLocation(),
419                                               true, ParseInitializer());
420   }
421 
422   Diag(Tok, diag::err_expected_equal_designator);
423   return ExprError();
424 }
425 
426 /// ParseBraceInitializer - Called when parsing an initializer that has a
427 /// leading open brace.
428 ///
429 ///       initializer: [C99 6.7.8]
430 ///         '{' initializer-list '}'
431 ///         '{' initializer-list ',' '}'
432 /// [GNU]   '{' '}'
433 ///
434 ///       initializer-list:
435 ///         designation[opt] initializer ...[opt]
436 ///         initializer-list ',' designation[opt] initializer ...[opt]
437 ///
438 ExprResult Parser::ParseBraceInitializer() {
439   InMessageExpressionRAIIObject InMessage(*this, false);
440 
441   BalancedDelimiterTracker T(*this, tok::l_brace);
442   T.consumeOpen();
443   SourceLocation LBraceLoc = T.getOpenLocation();
444 
445   /// InitExprs - This is the actual list of expressions contained in the
446   /// initializer.
447   ExprVector InitExprs;
448 
449   if (Tok.is(tok::r_brace)) {
450     // Empty initializers are a C++ feature and a GNU extension to C.
451     if (!getLangOpts().CPlusPlus)
452       Diag(LBraceLoc, diag::ext_gnu_empty_initializer);
453     // Match the '}'.
454     return Actions.ActOnInitList(LBraceLoc, None, ConsumeBrace());
455   }
456 
457   // Enter an appropriate expression evaluation context for an initializer list.
458   EnterExpressionEvaluationContext EnterContext(
459       Actions, EnterExpressionEvaluationContext::InitList);
460 
461   bool InitExprsOk = true;
462   DesignatorCompletionInfo DesignatorCompletion{
463       InitExprs,
464       PreferredType.get(T.getOpenLocation()),
465   };
466 
467   while (1) {
468     // Handle Microsoft __if_exists/if_not_exists if necessary.
469     if (getLangOpts().MicrosoftExt && (Tok.is(tok::kw___if_exists) ||
470         Tok.is(tok::kw___if_not_exists))) {
471       if (ParseMicrosoftIfExistsBraceInitializer(InitExprs, InitExprsOk)) {
472         if (Tok.isNot(tok::comma)) break;
473         ConsumeToken();
474       }
475       if (Tok.is(tok::r_brace)) break;
476       continue;
477     }
478 
479     // Parse: designation[opt] initializer
480 
481     // If we know that this cannot be a designation, just parse the nested
482     // initializer directly.
483     ExprResult SubElt;
484     if (MayBeDesignationStart())
485       SubElt = ParseInitializerWithPotentialDesignator(DesignatorCompletion);
486     else
487       SubElt = ParseInitializer();
488 
489     if (Tok.is(tok::ellipsis))
490       SubElt = Actions.ActOnPackExpansion(SubElt.get(), ConsumeToken());
491 
492     SubElt = Actions.CorrectDelayedTyposInExpr(SubElt.get());
493 
494     // If we couldn't parse the subelement, bail out.
495     if (SubElt.isUsable()) {
496       InitExprs.push_back(SubElt.get());
497     } else {
498       InitExprsOk = false;
499 
500       // We have two ways to try to recover from this error: if the code looks
501       // grammatically ok (i.e. we have a comma coming up) try to continue
502       // parsing the rest of the initializer.  This allows us to emit
503       // diagnostics for later elements that we find.  If we don't see a comma,
504       // assume there is a parse error, and just skip to recover.
505       // FIXME: This comment doesn't sound right. If there is a r_brace
506       // immediately, it can't be an error, since there is no other way of
507       // leaving this loop except through this if.
508       if (Tok.isNot(tok::comma)) {
509         SkipUntil(tok::r_brace, StopBeforeMatch);
510         break;
511       }
512     }
513 
514     // If we don't have a comma continued list, we're done.
515     if (Tok.isNot(tok::comma)) break;
516 
517     // TODO: save comma locations if some client cares.
518     ConsumeToken();
519 
520     // Handle trailing comma.
521     if (Tok.is(tok::r_brace)) break;
522   }
523 
524   bool closed = !T.consumeClose();
525 
526   if (InitExprsOk && closed)
527     return Actions.ActOnInitList(LBraceLoc, InitExprs,
528                                  T.getCloseLocation());
529 
530   return ExprError(); // an error occurred.
531 }
532 
533 
534 // Return true if a comma (or closing brace) is necessary after the
535 // __if_exists/if_not_exists statement.
536 bool Parser::ParseMicrosoftIfExistsBraceInitializer(ExprVector &InitExprs,
537                                                     bool &InitExprsOk) {
538   bool trailingComma = false;
539   IfExistsCondition Result;
540   if (ParseMicrosoftIfExistsCondition(Result))
541     return false;
542 
543   BalancedDelimiterTracker Braces(*this, tok::l_brace);
544   if (Braces.consumeOpen()) {
545     Diag(Tok, diag::err_expected) << tok::l_brace;
546     return false;
547   }
548 
549   switch (Result.Behavior) {
550   case IEB_Parse:
551     // Parse the declarations below.
552     break;
553 
554   case IEB_Dependent:
555     Diag(Result.KeywordLoc, diag::warn_microsoft_dependent_exists)
556       << Result.IsIfExists;
557     // Fall through to skip.
558     LLVM_FALLTHROUGH;
559 
560   case IEB_Skip:
561     Braces.skipToEnd();
562     return false;
563   }
564 
565   DesignatorCompletionInfo DesignatorCompletion{
566       InitExprs,
567       PreferredType.get(Braces.getOpenLocation()),
568   };
569   while (!isEofOrEom()) {
570     trailingComma = false;
571     // If we know that this cannot be a designation, just parse the nested
572     // initializer directly.
573     ExprResult SubElt;
574     if (MayBeDesignationStart())
575       SubElt = ParseInitializerWithPotentialDesignator(DesignatorCompletion);
576     else
577       SubElt = ParseInitializer();
578 
579     if (Tok.is(tok::ellipsis))
580       SubElt = Actions.ActOnPackExpansion(SubElt.get(), ConsumeToken());
581 
582     // If we couldn't parse the subelement, bail out.
583     if (!SubElt.isInvalid())
584       InitExprs.push_back(SubElt.get());
585     else
586       InitExprsOk = false;
587 
588     if (Tok.is(tok::comma)) {
589       ConsumeToken();
590       trailingComma = true;
591     }
592 
593     if (Tok.is(tok::r_brace))
594       break;
595   }
596 
597   Braces.consumeClose();
598 
599   return !trailingComma;
600 }
601