• Home
  • Line#
  • Scopes#
  • Navigate#
  • Raw
  • Download
1 //===--- MacroExpansion.cpp - Top level Macro Expansion -------------------===//
2 //
3 //                     The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This file implements the top level handling of macro expasion for the
11 // preprocessor.
12 //
13 //===----------------------------------------------------------------------===//
14 
15 #include "clang/Lex/Preprocessor.h"
16 #include "clang/Lex/MacroArgs.h"
17 #include "clang/Basic/FileManager.h"
18 #include "clang/Basic/SourceManager.h"
19 #include "clang/Basic/TargetInfo.h"
20 #include "clang/Lex/CodeCompletionHandler.h"
21 #include "clang/Lex/ExternalPreprocessorSource.h"
22 #include "clang/Lex/LexDiagnostic.h"
23 #include "clang/Lex/MacroInfo.h"
24 #include "llvm/ADT/STLExtras.h"
25 #include "llvm/ADT/SmallString.h"
26 #include "llvm/ADT/StringSwitch.h"
27 #include "llvm/Config/llvm-config.h"
28 #include "llvm/Support/ErrorHandling.h"
29 #include "llvm/Support/Format.h"
30 #include "llvm/Support/raw_ostream.h"
31 #include <cstdio>
32 #include <ctime>
33 using namespace clang;
34 
35 MacroDirective *
getMacroDirectiveHistory(const IdentifierInfo * II) const36 Preprocessor::getMacroDirectiveHistory(const IdentifierInfo *II) const {
37   assert(II->hadMacroDefinition() && "Identifier has not been not a macro!");
38 
39   macro_iterator Pos = Macros.find(II);
40   assert(Pos != Macros.end() && "Identifier macro info is missing!");
41   return Pos->second;
42 }
43 
appendMacroDirective(IdentifierInfo * II,MacroDirective * MD)44 void Preprocessor::appendMacroDirective(IdentifierInfo *II, MacroDirective *MD){
45   assert(MD && "MacroDirective should be non-zero!");
46   assert(!MD->getPrevious() && "Already attached to a MacroDirective history.");
47 
48   MacroDirective *&StoredMD = Macros[II];
49   MD->setPrevious(StoredMD);
50   StoredMD = MD;
51   II->setHasMacroDefinition(MD->isDefined());
52   bool isImportedMacro = isa<DefMacroDirective>(MD) &&
53                          cast<DefMacroDirective>(MD)->isImported();
54   if (II->isFromAST() && !isImportedMacro)
55     II->setChangedSinceDeserialization();
56 }
57 
setLoadedMacroDirective(IdentifierInfo * II,MacroDirective * MD)58 void Preprocessor::setLoadedMacroDirective(IdentifierInfo *II,
59                                            MacroDirective *MD) {
60   assert(II && MD);
61   MacroDirective *&StoredMD = Macros[II];
62   assert(!StoredMD &&
63          "the macro history was modified before initializing it from a pch");
64   StoredMD = MD;
65   // Setup the identifier as having associated macro history.
66   II->setHasMacroDefinition(true);
67   if (!MD->isDefined())
68     II->setHasMacroDefinition(false);
69 }
70 
71 /// RegisterBuiltinMacro - Register the specified identifier in the identifier
72 /// table and mark it as a builtin macro to be expanded.
RegisterBuiltinMacro(Preprocessor & PP,const char * Name)73 static IdentifierInfo *RegisterBuiltinMacro(Preprocessor &PP, const char *Name){
74   // Get the identifier.
75   IdentifierInfo *Id = PP.getIdentifierInfo(Name);
76 
77   // Mark it as being a macro that is builtin.
78   MacroInfo *MI = PP.AllocateMacroInfo(SourceLocation());
79   MI->setIsBuiltinMacro();
80   PP.appendDefMacroDirective(Id, MI);
81   return Id;
82 }
83 
84 
85 /// RegisterBuiltinMacros - Register builtin macros, such as __LINE__ with the
86 /// identifier table.
RegisterBuiltinMacros()87 void Preprocessor::RegisterBuiltinMacros() {
88   Ident__LINE__ = RegisterBuiltinMacro(*this, "__LINE__");
89   Ident__FILE__ = RegisterBuiltinMacro(*this, "__FILE__");
90   Ident__DATE__ = RegisterBuiltinMacro(*this, "__DATE__");
91   Ident__TIME__ = RegisterBuiltinMacro(*this, "__TIME__");
92   Ident__COUNTER__ = RegisterBuiltinMacro(*this, "__COUNTER__");
93   Ident_Pragma  = RegisterBuiltinMacro(*this, "_Pragma");
94 
95   // GCC Extensions.
96   Ident__BASE_FILE__     = RegisterBuiltinMacro(*this, "__BASE_FILE__");
97   Ident__INCLUDE_LEVEL__ = RegisterBuiltinMacro(*this, "__INCLUDE_LEVEL__");
98   Ident__TIMESTAMP__     = RegisterBuiltinMacro(*this, "__TIMESTAMP__");
99 
100   // Clang Extensions.
101   Ident__has_feature      = RegisterBuiltinMacro(*this, "__has_feature");
102   Ident__has_extension    = RegisterBuiltinMacro(*this, "__has_extension");
103   Ident__has_builtin      = RegisterBuiltinMacro(*this, "__has_builtin");
104   Ident__has_attribute    = RegisterBuiltinMacro(*this, "__has_attribute");
105   Ident__has_include      = RegisterBuiltinMacro(*this, "__has_include");
106   Ident__has_include_next = RegisterBuiltinMacro(*this, "__has_include_next");
107   Ident__has_warning      = RegisterBuiltinMacro(*this, "__has_warning");
108 
109   // Modules.
110   if (LangOpts.Modules) {
111     Ident__building_module  = RegisterBuiltinMacro(*this, "__building_module");
112 
113     // __MODULE__
114     if (!LangOpts.CurrentModule.empty())
115       Ident__MODULE__ = RegisterBuiltinMacro(*this, "__MODULE__");
116     else
117       Ident__MODULE__ = 0;
118   } else {
119     Ident__building_module = 0;
120     Ident__MODULE__ = 0;
121   }
122 
123   // Microsoft Extensions.
124   if (LangOpts.MicrosoftExt)
125     Ident__pragma = RegisterBuiltinMacro(*this, "__pragma");
126   else
127     Ident__pragma = 0;
128 }
129 
130 /// isTrivialSingleTokenExpansion - Return true if MI, which has a single token
131 /// in its expansion, currently expands to that token literally.
isTrivialSingleTokenExpansion(const MacroInfo * MI,const IdentifierInfo * MacroIdent,Preprocessor & PP)132 static bool isTrivialSingleTokenExpansion(const MacroInfo *MI,
133                                           const IdentifierInfo *MacroIdent,
134                                           Preprocessor &PP) {
135   IdentifierInfo *II = MI->getReplacementToken(0).getIdentifierInfo();
136 
137   // If the token isn't an identifier, it's always literally expanded.
138   if (II == 0) return true;
139 
140   // If the information about this identifier is out of date, update it from
141   // the external source.
142   if (II->isOutOfDate())
143     PP.getExternalSource()->updateOutOfDateIdentifier(*II);
144 
145   // If the identifier is a macro, and if that macro is enabled, it may be
146   // expanded so it's not a trivial expansion.
147   if (II->hasMacroDefinition() && PP.getMacroInfo(II)->isEnabled() &&
148       // Fast expanding "#define X X" is ok, because X would be disabled.
149       II != MacroIdent)
150     return false;
151 
152   // If this is an object-like macro invocation, it is safe to trivially expand
153   // it.
154   if (MI->isObjectLike()) return true;
155 
156   // If this is a function-like macro invocation, it's safe to trivially expand
157   // as long as the identifier is not a macro argument.
158   for (MacroInfo::arg_iterator I = MI->arg_begin(), E = MI->arg_end();
159        I != E; ++I)
160     if (*I == II)
161       return false;   // Identifier is a macro argument.
162 
163   return true;
164 }
165 
166 
167 /// isNextPPTokenLParen - Determine whether the next preprocessor token to be
168 /// lexed is a '('.  If so, consume the token and return true, if not, this
169 /// method should have no observable side-effect on the lexed tokens.
isNextPPTokenLParen()170 bool Preprocessor::isNextPPTokenLParen() {
171   // Do some quick tests for rejection cases.
172   unsigned Val;
173   if (CurLexer)
174     Val = CurLexer->isNextPPTokenLParen();
175   else if (CurPTHLexer)
176     Val = CurPTHLexer->isNextPPTokenLParen();
177   else
178     Val = CurTokenLexer->isNextTokenLParen();
179 
180   if (Val == 2) {
181     // We have run off the end.  If it's a source file we don't
182     // examine enclosing ones (C99 5.1.1.2p4).  Otherwise walk up the
183     // macro stack.
184     if (CurPPLexer)
185       return false;
186     for (unsigned i = IncludeMacroStack.size(); i != 0; --i) {
187       IncludeStackInfo &Entry = IncludeMacroStack[i-1];
188       if (Entry.TheLexer)
189         Val = Entry.TheLexer->isNextPPTokenLParen();
190       else if (Entry.ThePTHLexer)
191         Val = Entry.ThePTHLexer->isNextPPTokenLParen();
192       else
193         Val = Entry.TheTokenLexer->isNextTokenLParen();
194 
195       if (Val != 2)
196         break;
197 
198       // Ran off the end of a source file?
199       if (Entry.ThePPLexer)
200         return false;
201     }
202   }
203 
204   // Okay, if we know that the token is a '(', lex it and return.  Otherwise we
205   // have found something that isn't a '(' or we found the end of the
206   // translation unit.  In either case, return false.
207   return Val == 1;
208 }
209 
210 /// HandleMacroExpandedIdentifier - If an identifier token is read that is to be
211 /// expanded as a macro, handle it and return the next token as 'Identifier'.
HandleMacroExpandedIdentifier(Token & Identifier,MacroDirective * MD)212 bool Preprocessor::HandleMacroExpandedIdentifier(Token &Identifier,
213                                                  MacroDirective *MD) {
214   MacroDirective::DefInfo Def = MD->getDefinition();
215   assert(Def.isValid());
216   MacroInfo *MI = Def.getMacroInfo();
217 
218   // If this is a macro expansion in the "#if !defined(x)" line for the file,
219   // then the macro could expand to different things in other contexts, we need
220   // to disable the optimization in this case.
221   if (CurPPLexer) CurPPLexer->MIOpt.ExpandedMacro();
222 
223   // If this is a builtin macro, like __LINE__ or _Pragma, handle it specially.
224   if (MI->isBuiltinMacro()) {
225     if (Callbacks) Callbacks->MacroExpands(Identifier, MD,
226                                            Identifier.getLocation(),/*Args=*/0);
227     ExpandBuiltinMacro(Identifier);
228     return false;
229   }
230 
231   /// Args - If this is a function-like macro expansion, this contains,
232   /// for each macro argument, the list of tokens that were provided to the
233   /// invocation.
234   MacroArgs *Args = 0;
235 
236   // Remember where the end of the expansion occurred.  For an object-like
237   // macro, this is the identifier.  For a function-like macro, this is the ')'.
238   SourceLocation ExpansionEnd = Identifier.getLocation();
239 
240   // If this is a function-like macro, read the arguments.
241   if (MI->isFunctionLike()) {
242     // C99 6.10.3p10: If the preprocessing token immediately after the macro
243     // name isn't a '(', this macro should not be expanded.
244     if (!isNextPPTokenLParen())
245       return true;
246 
247     // Remember that we are now parsing the arguments to a macro invocation.
248     // Preprocessor directives used inside macro arguments are not portable, and
249     // this enables the warning.
250     InMacroArgs = true;
251     Args = ReadFunctionLikeMacroArgs(Identifier, MI, ExpansionEnd);
252 
253     // Finished parsing args.
254     InMacroArgs = false;
255 
256     // If there was an error parsing the arguments, bail out.
257     if (Args == 0) return false;
258 
259     ++NumFnMacroExpanded;
260   } else {
261     ++NumMacroExpanded;
262   }
263 
264   // Notice that this macro has been used.
265   markMacroAsUsed(MI);
266 
267   // Remember where the token is expanded.
268   SourceLocation ExpandLoc = Identifier.getLocation();
269   SourceRange ExpansionRange(ExpandLoc, ExpansionEnd);
270 
271   if (Callbacks) {
272     if (InMacroArgs) {
273       // We can have macro expansion inside a conditional directive while
274       // reading the function macro arguments. To ensure, in that case, that
275       // MacroExpands callbacks still happen in source order, queue this
276       // callback to have it happen after the function macro callback.
277       DelayedMacroExpandsCallbacks.push_back(
278                               MacroExpandsInfo(Identifier, MD, ExpansionRange));
279     } else {
280       Callbacks->MacroExpands(Identifier, MD, ExpansionRange, Args);
281       if (!DelayedMacroExpandsCallbacks.empty()) {
282         for (unsigned i=0, e = DelayedMacroExpandsCallbacks.size(); i!=e; ++i) {
283           MacroExpandsInfo &Info = DelayedMacroExpandsCallbacks[i];
284           // FIXME: We lose macro args info with delayed callback.
285           Callbacks->MacroExpands(Info.Tok, Info.MD, Info.Range, /*Args=*/0);
286         }
287         DelayedMacroExpandsCallbacks.clear();
288       }
289     }
290   }
291 
292   // If the macro definition is ambiguous, complain.
293   if (Def.getDirective()->isAmbiguous()) {
294     Diag(Identifier, diag::warn_pp_ambiguous_macro)
295       << Identifier.getIdentifierInfo();
296     Diag(MI->getDefinitionLoc(), diag::note_pp_ambiguous_macro_chosen)
297       << Identifier.getIdentifierInfo();
298     for (MacroDirective::DefInfo PrevDef = Def.getPreviousDefinition();
299          PrevDef && !PrevDef.isUndefined();
300          PrevDef = PrevDef.getPreviousDefinition()) {
301       if (PrevDef.getDirective()->isAmbiguous()) {
302         Diag(PrevDef.getMacroInfo()->getDefinitionLoc(),
303              diag::note_pp_ambiguous_macro_other)
304           << Identifier.getIdentifierInfo();
305       }
306     }
307   }
308 
309   // If we started lexing a macro, enter the macro expansion body.
310 
311   // If this macro expands to no tokens, don't bother to push it onto the
312   // expansion stack, only to take it right back off.
313   if (MI->getNumTokens() == 0) {
314     // No need for arg info.
315     if (Args) Args->destroy(*this);
316 
317     // Ignore this macro use, just return the next token in the current
318     // buffer.
319     bool HadLeadingSpace = Identifier.hasLeadingSpace();
320     bool IsAtStartOfLine = Identifier.isAtStartOfLine();
321 
322     Lex(Identifier);
323 
324     // If the identifier isn't on some OTHER line, inherit the leading
325     // whitespace/first-on-a-line property of this token.  This handles
326     // stuff like "! XX," -> "! ," and "   XX," -> "    ,", when XX is
327     // empty.
328     if (!Identifier.isAtStartOfLine()) {
329       if (IsAtStartOfLine) Identifier.setFlag(Token::StartOfLine);
330       if (HadLeadingSpace) Identifier.setFlag(Token::LeadingSpace);
331     }
332     Identifier.setFlag(Token::LeadingEmptyMacro);
333     ++NumFastMacroExpanded;
334     return false;
335 
336   } else if (MI->getNumTokens() == 1 &&
337              isTrivialSingleTokenExpansion(MI, Identifier.getIdentifierInfo(),
338                                            *this)) {
339     // Otherwise, if this macro expands into a single trivially-expanded
340     // token: expand it now.  This handles common cases like
341     // "#define VAL 42".
342 
343     // No need for arg info.
344     if (Args) Args->destroy(*this);
345 
346     // Propagate the isAtStartOfLine/hasLeadingSpace markers of the macro
347     // identifier to the expanded token.
348     bool isAtStartOfLine = Identifier.isAtStartOfLine();
349     bool hasLeadingSpace = Identifier.hasLeadingSpace();
350 
351     // Replace the result token.
352     Identifier = MI->getReplacementToken(0);
353 
354     // Restore the StartOfLine/LeadingSpace markers.
355     Identifier.setFlagValue(Token::StartOfLine , isAtStartOfLine);
356     Identifier.setFlagValue(Token::LeadingSpace, hasLeadingSpace);
357 
358     // Update the tokens location to include both its expansion and physical
359     // locations.
360     SourceLocation Loc =
361       SourceMgr.createExpansionLoc(Identifier.getLocation(), ExpandLoc,
362                                    ExpansionEnd,Identifier.getLength());
363     Identifier.setLocation(Loc);
364 
365     // If this is a disabled macro or #define X X, we must mark the result as
366     // unexpandable.
367     if (IdentifierInfo *NewII = Identifier.getIdentifierInfo()) {
368       if (MacroInfo *NewMI = getMacroInfo(NewII))
369         if (!NewMI->isEnabled() || NewMI == MI) {
370           Identifier.setFlag(Token::DisableExpand);
371           // Don't warn for "#define X X" like "#define bool bool" from
372           // stdbool.h.
373           if (NewMI != MI || MI->isFunctionLike())
374             Diag(Identifier, diag::pp_disabled_macro_expansion);
375         }
376     }
377 
378     // Since this is not an identifier token, it can't be macro expanded, so
379     // we're done.
380     ++NumFastMacroExpanded;
381     return false;
382   }
383 
384   // Start expanding the macro.
385   EnterMacro(Identifier, ExpansionEnd, MI, Args);
386 
387   // Now that the macro is at the top of the include stack, ask the
388   // preprocessor to read the next token from it.
389   Lex(Identifier);
390   return false;
391 }
392 
393 enum Bracket {
394   Brace,
395   Paren
396 };
397 
398 /// CheckMatchedBrackets - Returns true if the braces and parentheses in the
399 /// token vector are properly nested.
CheckMatchedBrackets(const SmallVectorImpl<Token> & Tokens)400 static bool CheckMatchedBrackets(const SmallVectorImpl<Token> &Tokens) {
401   SmallVector<Bracket, 8> Brackets;
402   for (SmallVectorImpl<Token>::const_iterator I = Tokens.begin(),
403                                               E = Tokens.end();
404        I != E; ++I) {
405     if (I->is(tok::l_paren)) {
406       Brackets.push_back(Paren);
407     } else if (I->is(tok::r_paren)) {
408       if (Brackets.empty() || Brackets.back() == Brace)
409         return false;
410       Brackets.pop_back();
411     } else if (I->is(tok::l_brace)) {
412       Brackets.push_back(Brace);
413     } else if (I->is(tok::r_brace)) {
414       if (Brackets.empty() || Brackets.back() == Paren)
415         return false;
416       Brackets.pop_back();
417     }
418   }
419   if (!Brackets.empty())
420     return false;
421   return true;
422 }
423 
424 /// GenerateNewArgTokens - Returns true if OldTokens can be converted to a new
425 /// vector of tokens in NewTokens.  The new number of arguments will be placed
426 /// in NumArgs and the ranges which need to surrounded in parentheses will be
427 /// in ParenHints.
428 /// Returns false if the token stream cannot be changed.  If this is because
429 /// of an initializer list starting a macro argument, the range of those
430 /// initializer lists will be place in InitLists.
GenerateNewArgTokens(Preprocessor & PP,SmallVectorImpl<Token> & OldTokens,SmallVectorImpl<Token> & NewTokens,unsigned & NumArgs,SmallVectorImpl<SourceRange> & ParenHints,SmallVectorImpl<SourceRange> & InitLists)431 static bool GenerateNewArgTokens(Preprocessor &PP,
432                                  SmallVectorImpl<Token> &OldTokens,
433                                  SmallVectorImpl<Token> &NewTokens,
434                                  unsigned &NumArgs,
435                                  SmallVectorImpl<SourceRange> &ParenHints,
436                                  SmallVectorImpl<SourceRange> &InitLists) {
437   if (!CheckMatchedBrackets(OldTokens))
438     return false;
439 
440   // Once it is known that the brackets are matched, only a simple count of the
441   // braces is needed.
442   unsigned Braces = 0;
443 
444   // First token of a new macro argument.
445   SmallVectorImpl<Token>::iterator ArgStartIterator = OldTokens.begin();
446 
447   // First closing brace in a new macro argument.  Used to generate
448   // SourceRanges for InitLists.
449   SmallVectorImpl<Token>::iterator ClosingBrace = OldTokens.end();
450   NumArgs = 0;
451   Token TempToken;
452   // Set to true when a macro separator token is found inside a braced list.
453   // If true, the fixed argument spans multiple old arguments and ParenHints
454   // will be updated.
455   bool FoundSeparatorToken = false;
456   for (SmallVectorImpl<Token>::iterator I = OldTokens.begin(),
457                                         E = OldTokens.end();
458        I != E; ++I) {
459     if (I->is(tok::l_brace)) {
460       ++Braces;
461     } else if (I->is(tok::r_brace)) {
462       --Braces;
463       if (Braces == 0 && ClosingBrace == E && FoundSeparatorToken)
464         ClosingBrace = I;
465     } else if (I->is(tok::eof)) {
466       // EOF token is used to separate macro arguments
467       if (Braces != 0) {
468         // Assume comma separator is actually braced list separator and change
469         // it back to a comma.
470         FoundSeparatorToken = true;
471         I->setKind(tok::comma);
472         I->setLength(1);
473       } else { // Braces == 0
474         // Separator token still separates arguments.
475         ++NumArgs;
476 
477         // If the argument starts with a brace, it can't be fixed with
478         // parentheses.  A different diagnostic will be given.
479         if (FoundSeparatorToken && ArgStartIterator->is(tok::l_brace)) {
480           InitLists.push_back(
481               SourceRange(ArgStartIterator->getLocation(),
482                           PP.getLocForEndOfToken(ClosingBrace->getLocation())));
483           ClosingBrace = E;
484         }
485 
486         // Add left paren
487         if (FoundSeparatorToken) {
488           TempToken.startToken();
489           TempToken.setKind(tok::l_paren);
490           TempToken.setLocation(ArgStartIterator->getLocation());
491           TempToken.setLength(0);
492           NewTokens.push_back(TempToken);
493         }
494 
495         // Copy over argument tokens
496         NewTokens.insert(NewTokens.end(), ArgStartIterator, I);
497 
498         // Add right paren and store the paren locations in ParenHints
499         if (FoundSeparatorToken) {
500           SourceLocation Loc = PP.getLocForEndOfToken((I - 1)->getLocation());
501           TempToken.startToken();
502           TempToken.setKind(tok::r_paren);
503           TempToken.setLocation(Loc);
504           TempToken.setLength(0);
505           NewTokens.push_back(TempToken);
506           ParenHints.push_back(SourceRange(ArgStartIterator->getLocation(),
507                                            Loc));
508         }
509 
510         // Copy separator token
511         NewTokens.push_back(*I);
512 
513         // Reset values
514         ArgStartIterator = I + 1;
515         FoundSeparatorToken = false;
516       }
517     }
518   }
519 
520   return !ParenHints.empty() && InitLists.empty();
521 }
522 
523 /// ReadFunctionLikeMacroArgs - After reading "MACRO" and knowing that the next
524 /// token is the '(' of the macro, this method is invoked to read all of the
525 /// actual arguments specified for the macro invocation.  This returns null on
526 /// error.
ReadFunctionLikeMacroArgs(Token & MacroName,MacroInfo * MI,SourceLocation & MacroEnd)527 MacroArgs *Preprocessor::ReadFunctionLikeMacroArgs(Token &MacroName,
528                                                    MacroInfo *MI,
529                                                    SourceLocation &MacroEnd) {
530   // The number of fixed arguments to parse.
531   unsigned NumFixedArgsLeft = MI->getNumArgs();
532   bool isVariadic = MI->isVariadic();
533 
534   // Outer loop, while there are more arguments, keep reading them.
535   Token Tok;
536 
537   // Read arguments as unexpanded tokens.  This avoids issues, e.g., where
538   // an argument value in a macro could expand to ',' or '(' or ')'.
539   LexUnexpandedToken(Tok);
540   assert(Tok.is(tok::l_paren) && "Error computing l-paren-ness?");
541 
542   // ArgTokens - Build up a list of tokens that make up each argument.  Each
543   // argument is separated by an EOF token.  Use a SmallVector so we can avoid
544   // heap allocations in the common case.
545   SmallVector<Token, 64> ArgTokens;
546   bool ContainsCodeCompletionTok = false;
547 
548   SourceLocation TooManyArgsLoc;
549 
550   unsigned NumActuals = 0;
551   while (Tok.isNot(tok::r_paren)) {
552     if (ContainsCodeCompletionTok && (Tok.is(tok::eof) || Tok.is(tok::eod)))
553       break;
554 
555     assert((Tok.is(tok::l_paren) || Tok.is(tok::comma)) &&
556            "only expect argument separators here");
557 
558     unsigned ArgTokenStart = ArgTokens.size();
559     SourceLocation ArgStartLoc = Tok.getLocation();
560 
561     // C99 6.10.3p11: Keep track of the number of l_parens we have seen.  Note
562     // that we already consumed the first one.
563     unsigned NumParens = 0;
564 
565     while (1) {
566       // Read arguments as unexpanded tokens.  This avoids issues, e.g., where
567       // an argument value in a macro could expand to ',' or '(' or ')'.
568       LexUnexpandedToken(Tok);
569 
570       if (Tok.is(tok::eof) || Tok.is(tok::eod)) { // "#if f(<eof>" & "#if f(\n"
571         if (!ContainsCodeCompletionTok) {
572           Diag(MacroName, diag::err_unterm_macro_invoc);
573           Diag(MI->getDefinitionLoc(), diag::note_macro_here)
574             << MacroName.getIdentifierInfo();
575           // Do not lose the EOF/EOD.  Return it to the client.
576           MacroName = Tok;
577           return 0;
578         } else {
579           // Do not lose the EOF/EOD.
580           Token *Toks = new Token[1];
581           Toks[0] = Tok;
582           EnterTokenStream(Toks, 1, true, true);
583           break;
584         }
585       } else if (Tok.is(tok::r_paren)) {
586         // If we found the ) token, the macro arg list is done.
587         if (NumParens-- == 0) {
588           MacroEnd = Tok.getLocation();
589           break;
590         }
591       } else if (Tok.is(tok::l_paren)) {
592         ++NumParens;
593       } else if (Tok.is(tok::comma) && NumParens == 0 &&
594                  !(Tok.getFlags() & Token::IgnoredComma)) {
595         // In Microsoft-compatibility mode, single commas from nested macro
596         // expansions should not be considered as argument separators. We test
597         // for this with the IgnoredComma token flag above.
598 
599         // Comma ends this argument if there are more fixed arguments expected.
600         // However, if this is a variadic macro, and this is part of the
601         // variadic part, then the comma is just an argument token.
602         if (!isVariadic) break;
603         if (NumFixedArgsLeft > 1)
604           break;
605       } else if (Tok.is(tok::comment) && !KeepMacroComments) {
606         // If this is a comment token in the argument list and we're just in
607         // -C mode (not -CC mode), discard the comment.
608         continue;
609       } else if (Tok.getIdentifierInfo() != 0) {
610         // Reading macro arguments can cause macros that we are currently
611         // expanding from to be popped off the expansion stack.  Doing so causes
612         // them to be reenabled for expansion.  Here we record whether any
613         // identifiers we lex as macro arguments correspond to disabled macros.
614         // If so, we mark the token as noexpand.  This is a subtle aspect of
615         // C99 6.10.3.4p2.
616         if (MacroInfo *MI = getMacroInfo(Tok.getIdentifierInfo()))
617           if (!MI->isEnabled())
618             Tok.setFlag(Token::DisableExpand);
619       } else if (Tok.is(tok::code_completion)) {
620         ContainsCodeCompletionTok = true;
621         if (CodeComplete)
622           CodeComplete->CodeCompleteMacroArgument(MacroName.getIdentifierInfo(),
623                                                   MI, NumActuals);
624         // Don't mark that we reached the code-completion point because the
625         // parser is going to handle the token and there will be another
626         // code-completion callback.
627       }
628 
629       ArgTokens.push_back(Tok);
630     }
631 
632     // If this was an empty argument list foo(), don't add this as an empty
633     // argument.
634     if (ArgTokens.empty() && Tok.getKind() == tok::r_paren)
635       break;
636 
637     // If this is not a variadic macro, and too many args were specified, emit
638     // an error.
639     if (!isVariadic && NumFixedArgsLeft == 0 && TooManyArgsLoc.isInvalid()) {
640       if (ArgTokens.size() != ArgTokenStart)
641         TooManyArgsLoc = ArgTokens[ArgTokenStart].getLocation();
642       else
643         TooManyArgsLoc = ArgStartLoc;
644     }
645 
646     // Empty arguments are standard in C99 and C++0x, and are supported as an
647     // extension in other modes.
648     if (ArgTokens.size() == ArgTokenStart && !LangOpts.C99)
649       Diag(Tok, LangOpts.CPlusPlus11 ?
650            diag::warn_cxx98_compat_empty_fnmacro_arg :
651            diag::ext_empty_fnmacro_arg);
652 
653     // Add a marker EOF token to the end of the token list for this argument.
654     Token EOFTok;
655     EOFTok.startToken();
656     EOFTok.setKind(tok::eof);
657     EOFTok.setLocation(Tok.getLocation());
658     EOFTok.setLength(0);
659     ArgTokens.push_back(EOFTok);
660     ++NumActuals;
661     if (!ContainsCodeCompletionTok && NumFixedArgsLeft != 0)
662       --NumFixedArgsLeft;
663   }
664 
665   // Okay, we either found the r_paren.  Check to see if we parsed too few
666   // arguments.
667   unsigned MinArgsExpected = MI->getNumArgs();
668 
669   // If this is not a variadic macro, and too many args were specified, emit
670   // an error.
671   if (!isVariadic && NumActuals > MinArgsExpected &&
672       !ContainsCodeCompletionTok) {
673     // Emit the diagnostic at the macro name in case there is a missing ).
674     // Emitting it at the , could be far away from the macro name.
675     Diag(TooManyArgsLoc, diag::err_too_many_args_in_macro_invoc);
676     Diag(MI->getDefinitionLoc(), diag::note_macro_here)
677       << MacroName.getIdentifierInfo();
678 
679     // Commas from braced initializer lists will be treated as argument
680     // separators inside macros.  Attempt to correct for this with parentheses.
681     // TODO: See if this can be generalized to angle brackets for templates
682     // inside macro arguments.
683 
684     SmallVector<Token, 4> FixedArgTokens;
685     unsigned FixedNumArgs = 0;
686     SmallVector<SourceRange, 4> ParenHints, InitLists;
687     if (!GenerateNewArgTokens(*this, ArgTokens, FixedArgTokens, FixedNumArgs,
688                               ParenHints, InitLists)) {
689       if (!InitLists.empty()) {
690         DiagnosticBuilder DB =
691             Diag(MacroName,
692                  diag::note_init_list_at_beginning_of_macro_argument);
693         for (SmallVector<SourceRange, 4>::iterator
694                  Range = InitLists.begin(), RangeEnd = InitLists.end();
695                  Range != RangeEnd; ++Range) {
696           if (DB.hasMaxRanges())
697             break;
698           DB << *Range;
699         }
700       }
701       return 0;
702     }
703     if (FixedNumArgs != MinArgsExpected)
704       return 0;
705 
706     DiagnosticBuilder DB = Diag(MacroName, diag::note_suggest_parens_for_macro);
707     for (SmallVector<SourceRange, 4>::iterator
708              ParenLocation = ParenHints.begin(), ParenEnd = ParenHints.end();
709          ParenLocation != ParenEnd; ++ParenLocation) {
710       if (DB.hasMaxFixItHints())
711         break;
712       DB << FixItHint::CreateInsertion(ParenLocation->getBegin(), "(");
713       if (DB.hasMaxFixItHints())
714         break;
715       DB << FixItHint::CreateInsertion(ParenLocation->getEnd(), ")");
716     }
717     ArgTokens.swap(FixedArgTokens);
718     NumActuals = FixedNumArgs;
719   }
720 
721   // See MacroArgs instance var for description of this.
722   bool isVarargsElided = false;
723 
724   if (ContainsCodeCompletionTok) {
725     // Recover from not-fully-formed macro invocation during code-completion.
726     Token EOFTok;
727     EOFTok.startToken();
728     EOFTok.setKind(tok::eof);
729     EOFTok.setLocation(Tok.getLocation());
730     EOFTok.setLength(0);
731     for (; NumActuals < MinArgsExpected; ++NumActuals)
732       ArgTokens.push_back(EOFTok);
733   }
734 
735   if (NumActuals < MinArgsExpected) {
736     // There are several cases where too few arguments is ok, handle them now.
737     if (NumActuals == 0 && MinArgsExpected == 1) {
738       // #define A(X)  or  #define A(...)   ---> A()
739 
740       // If there is exactly one argument, and that argument is missing,
741       // then we have an empty "()" argument empty list.  This is fine, even if
742       // the macro expects one argument (the argument is just empty).
743       isVarargsElided = MI->isVariadic();
744     } else if (MI->isVariadic() &&
745                (NumActuals+1 == MinArgsExpected ||  // A(x, ...) -> A(X)
746                 (NumActuals == 0 && MinArgsExpected == 2))) {// A(x,...) -> A()
747       // Varargs where the named vararg parameter is missing: OK as extension.
748       //   #define A(x, ...)
749       //   A("blah")
750       //
751       // If the macro contains the comma pasting extension, the diagnostic
752       // is suppressed; we know we'll get another diagnostic later.
753       if (!MI->hasCommaPasting()) {
754         Diag(Tok, diag::ext_missing_varargs_arg);
755         Diag(MI->getDefinitionLoc(), diag::note_macro_here)
756           << MacroName.getIdentifierInfo();
757       }
758 
759       // Remember this occurred, allowing us to elide the comma when used for
760       // cases like:
761       //   #define A(x, foo...) blah(a, ## foo)
762       //   #define B(x, ...) blah(a, ## __VA_ARGS__)
763       //   #define C(...) blah(a, ## __VA_ARGS__)
764       //  A(x) B(x) C()
765       isVarargsElided = true;
766     } else if (!ContainsCodeCompletionTok) {
767       // Otherwise, emit the error.
768       Diag(Tok, diag::err_too_few_args_in_macro_invoc);
769       Diag(MI->getDefinitionLoc(), diag::note_macro_here)
770         << MacroName.getIdentifierInfo();
771       return 0;
772     }
773 
774     // Add a marker EOF token to the end of the token list for this argument.
775     SourceLocation EndLoc = Tok.getLocation();
776     Tok.startToken();
777     Tok.setKind(tok::eof);
778     Tok.setLocation(EndLoc);
779     Tok.setLength(0);
780     ArgTokens.push_back(Tok);
781 
782     // If we expect two arguments, add both as empty.
783     if (NumActuals == 0 && MinArgsExpected == 2)
784       ArgTokens.push_back(Tok);
785 
786   } else if (NumActuals > MinArgsExpected && !MI->isVariadic() &&
787              !ContainsCodeCompletionTok) {
788     // Emit the diagnostic at the macro name in case there is a missing ).
789     // Emitting it at the , could be far away from the macro name.
790     Diag(MacroName, diag::err_too_many_args_in_macro_invoc);
791     Diag(MI->getDefinitionLoc(), diag::note_macro_here)
792       << MacroName.getIdentifierInfo();
793     return 0;
794   }
795 
796   return MacroArgs::create(MI, ArgTokens, isVarargsElided, *this);
797 }
798 
799 /// \brief Keeps macro expanded tokens for TokenLexers.
800 //
801 /// Works like a stack; a TokenLexer adds the macro expanded tokens that is
802 /// going to lex in the cache and when it finishes the tokens are removed
803 /// from the end of the cache.
cacheMacroExpandedTokens(TokenLexer * tokLexer,ArrayRef<Token> tokens)804 Token *Preprocessor::cacheMacroExpandedTokens(TokenLexer *tokLexer,
805                                               ArrayRef<Token> tokens) {
806   assert(tokLexer);
807   if (tokens.empty())
808     return 0;
809 
810   size_t newIndex = MacroExpandedTokens.size();
811   bool cacheNeedsToGrow = tokens.size() >
812                       MacroExpandedTokens.capacity()-MacroExpandedTokens.size();
813   MacroExpandedTokens.append(tokens.begin(), tokens.end());
814 
815   if (cacheNeedsToGrow) {
816     // Go through all the TokenLexers whose 'Tokens' pointer points in the
817     // buffer and update the pointers to the (potential) new buffer array.
818     for (unsigned i = 0, e = MacroExpandingLexersStack.size(); i != e; ++i) {
819       TokenLexer *prevLexer;
820       size_t tokIndex;
821       llvm::tie(prevLexer, tokIndex) = MacroExpandingLexersStack[i];
822       prevLexer->Tokens = MacroExpandedTokens.data() + tokIndex;
823     }
824   }
825 
826   MacroExpandingLexersStack.push_back(std::make_pair(tokLexer, newIndex));
827   return MacroExpandedTokens.data() + newIndex;
828 }
829 
removeCachedMacroExpandedTokensOfLastLexer()830 void Preprocessor::removeCachedMacroExpandedTokensOfLastLexer() {
831   assert(!MacroExpandingLexersStack.empty());
832   size_t tokIndex = MacroExpandingLexersStack.back().second;
833   assert(tokIndex < MacroExpandedTokens.size());
834   // Pop the cached macro expanded tokens from the end.
835   MacroExpandedTokens.resize(tokIndex);
836   MacroExpandingLexersStack.pop_back();
837 }
838 
839 /// ComputeDATE_TIME - Compute the current time, enter it into the specified
840 /// scratch buffer, then return DATELoc/TIMELoc locations with the position of
841 /// the identifier tokens inserted.
ComputeDATE_TIME(SourceLocation & DATELoc,SourceLocation & TIMELoc,Preprocessor & PP)842 static void ComputeDATE_TIME(SourceLocation &DATELoc, SourceLocation &TIMELoc,
843                              Preprocessor &PP) {
844   time_t TT = time(0);
845   struct tm *TM = localtime(&TT);
846 
847   static const char * const Months[] = {
848     "Jan","Feb","Mar","Apr","May","Jun","Jul","Aug","Sep","Oct","Nov","Dec"
849   };
850 
851   {
852     SmallString<32> TmpBuffer;
853     llvm::raw_svector_ostream TmpStream(TmpBuffer);
854     TmpStream << llvm::format("\"%s %2d %4d\"", Months[TM->tm_mon],
855                               TM->tm_mday, TM->tm_year + 1900);
856     Token TmpTok;
857     TmpTok.startToken();
858     PP.CreateString(TmpStream.str(), TmpTok);
859     DATELoc = TmpTok.getLocation();
860   }
861 
862   {
863     SmallString<32> TmpBuffer;
864     llvm::raw_svector_ostream TmpStream(TmpBuffer);
865     TmpStream << llvm::format("\"%02d:%02d:%02d\"",
866                               TM->tm_hour, TM->tm_min, TM->tm_sec);
867     Token TmpTok;
868     TmpTok.startToken();
869     PP.CreateString(TmpStream.str(), TmpTok);
870     TIMELoc = TmpTok.getLocation();
871   }
872 }
873 
874 
875 /// HasFeature - Return true if we recognize and implement the feature
876 /// specified by the identifier as a standard language feature.
HasFeature(const Preprocessor & PP,const IdentifierInfo * II)877 static bool HasFeature(const Preprocessor &PP, const IdentifierInfo *II) {
878   const LangOptions &LangOpts = PP.getLangOpts();
879   StringRef Feature = II->getName();
880 
881   // Normalize the feature name, __foo__ becomes foo.
882   if (Feature.startswith("__") && Feature.endswith("__") && Feature.size() >= 4)
883     Feature = Feature.substr(2, Feature.size() - 4);
884 
885   return llvm::StringSwitch<bool>(Feature)
886            .Case("address_sanitizer", LangOpts.Sanitize.Address)
887            .Case("attribute_analyzer_noreturn", true)
888            .Case("attribute_availability", true)
889            .Case("attribute_availability_with_message", true)
890            .Case("attribute_cf_returns_not_retained", true)
891            .Case("attribute_cf_returns_retained", true)
892            .Case("attribute_deprecated_with_message", true)
893            .Case("attribute_ext_vector_type", true)
894            .Case("attribute_ns_returns_not_retained", true)
895            .Case("attribute_ns_returns_retained", true)
896            .Case("attribute_ns_consumes_self", true)
897            .Case("attribute_ns_consumed", true)
898            .Case("attribute_cf_consumed", true)
899            .Case("attribute_objc_ivar_unused", true)
900            .Case("attribute_objc_method_family", true)
901            .Case("attribute_overloadable", true)
902            .Case("attribute_unavailable_with_message", true)
903            .Case("attribute_unused_on_fields", true)
904            .Case("blocks", LangOpts.Blocks)
905            .Case("c_thread_safety_attributes", true)
906            .Case("cxx_exceptions", LangOpts.Exceptions)
907            .Case("cxx_rtti", LangOpts.RTTI)
908            .Case("enumerator_attributes", true)
909            .Case("memory_sanitizer", LangOpts.Sanitize.Memory)
910            .Case("thread_sanitizer", LangOpts.Sanitize.Thread)
911            // Objective-C features
912            .Case("objc_arr", LangOpts.ObjCAutoRefCount) // FIXME: REMOVE?
913            .Case("objc_arc", LangOpts.ObjCAutoRefCount)
914            .Case("objc_arc_weak", LangOpts.ObjCARCWeak)
915            .Case("objc_default_synthesize_properties", LangOpts.ObjC2)
916            .Case("objc_fixed_enum", LangOpts.ObjC2)
917            .Case("objc_instancetype", LangOpts.ObjC2)
918            .Case("objc_modules", LangOpts.ObjC2 && LangOpts.Modules)
919            .Case("objc_nonfragile_abi", LangOpts.ObjCRuntime.isNonFragile())
920            .Case("objc_property_explicit_atomic", true) // Does clang support explicit "atomic" keyword?
921            .Case("objc_weak_class", LangOpts.ObjCRuntime.hasWeakClassImport())
922            .Case("objc_msg_lookup_stret", LangOpts.ObjCRuntime.getKind() == ObjCRuntime::ObjFW)
923            .Case("ownership_holds", true)
924            .Case("ownership_returns", true)
925            .Case("ownership_takes", true)
926            .Case("objc_bool", true)
927            .Case("objc_subscripting", LangOpts.ObjCRuntime.isNonFragile())
928            .Case("objc_array_literals", LangOpts.ObjC2)
929            .Case("objc_dictionary_literals", LangOpts.ObjC2)
930            .Case("objc_boxed_expressions", LangOpts.ObjC2)
931            .Case("arc_cf_code_audited", true)
932            // C11 features
933            .Case("c_alignas", LangOpts.C11)
934            .Case("c_atomic", LangOpts.C11)
935            .Case("c_generic_selections", LangOpts.C11)
936            .Case("c_static_assert", LangOpts.C11)
937            .Case("c_thread_local",
938                  LangOpts.C11 && PP.getTargetInfo().isTLSSupported())
939            // C++11 features
940            .Case("cxx_access_control_sfinae", LangOpts.CPlusPlus11)
941            .Case("cxx_alias_templates", LangOpts.CPlusPlus11)
942            .Case("cxx_alignas", LangOpts.CPlusPlus11)
943            .Case("cxx_atomic", LangOpts.CPlusPlus11)
944            .Case("cxx_attributes", LangOpts.CPlusPlus11)
945            .Case("cxx_auto_type", LangOpts.CPlusPlus11)
946            .Case("cxx_constexpr", LangOpts.CPlusPlus11)
947            .Case("cxx_decltype", LangOpts.CPlusPlus11)
948            .Case("cxx_decltype_incomplete_return_types", LangOpts.CPlusPlus11)
949            .Case("cxx_default_function_template_args", LangOpts.CPlusPlus11)
950            .Case("cxx_defaulted_functions", LangOpts.CPlusPlus11)
951            .Case("cxx_delegating_constructors", LangOpts.CPlusPlus11)
952            .Case("cxx_deleted_functions", LangOpts.CPlusPlus11)
953            .Case("cxx_explicit_conversions", LangOpts.CPlusPlus11)
954            .Case("cxx_generalized_initializers", LangOpts.CPlusPlus11)
955            .Case("cxx_implicit_moves", LangOpts.CPlusPlus11)
956            .Case("cxx_inheriting_constructors", LangOpts.CPlusPlus11)
957            .Case("cxx_inline_namespaces", LangOpts.CPlusPlus11)
958            .Case("cxx_lambdas", LangOpts.CPlusPlus11)
959            .Case("cxx_local_type_template_args", LangOpts.CPlusPlus11)
960            .Case("cxx_nonstatic_member_init", LangOpts.CPlusPlus11)
961            .Case("cxx_noexcept", LangOpts.CPlusPlus11)
962            .Case("cxx_nullptr", LangOpts.CPlusPlus11)
963            .Case("cxx_override_control", LangOpts.CPlusPlus11)
964            .Case("cxx_range_for", LangOpts.CPlusPlus11)
965            .Case("cxx_raw_string_literals", LangOpts.CPlusPlus11)
966            .Case("cxx_reference_qualified_functions", LangOpts.CPlusPlus11)
967            .Case("cxx_rvalue_references", LangOpts.CPlusPlus11)
968            .Case("cxx_strong_enums", LangOpts.CPlusPlus11)
969            .Case("cxx_static_assert", LangOpts.CPlusPlus11)
970            .Case("cxx_thread_local",
971                  LangOpts.CPlusPlus11 && PP.getTargetInfo().isTLSSupported())
972            .Case("cxx_trailing_return", LangOpts.CPlusPlus11)
973            .Case("cxx_unicode_literals", LangOpts.CPlusPlus11)
974            .Case("cxx_unrestricted_unions", LangOpts.CPlusPlus11)
975            .Case("cxx_user_literals", LangOpts.CPlusPlus11)
976            .Case("cxx_variadic_templates", LangOpts.CPlusPlus11)
977            // C++1y features
978            .Case("cxx_aggregate_nsdmi", LangOpts.CPlusPlus1y)
979            .Case("cxx_binary_literals", LangOpts.CPlusPlus1y)
980            .Case("cxx_contextual_conversions", LangOpts.CPlusPlus1y)
981            //.Case("cxx_generic_lambda", LangOpts.CPlusPlus1y)
982            //.Case("cxx_init_capture", LangOpts.CPlusPlus1y)
983            .Case("cxx_relaxed_constexpr", LangOpts.CPlusPlus1y)
984            .Case("cxx_return_type_deduction", LangOpts.CPlusPlus1y)
985            //.Case("cxx_runtime_array", LangOpts.CPlusPlus1y)
986            //.Case("cxx_variable_templates", LangOpts.CPlusPlus1y)
987            // Type traits
988            .Case("has_nothrow_assign", LangOpts.CPlusPlus)
989            .Case("has_nothrow_copy", LangOpts.CPlusPlus)
990            .Case("has_nothrow_constructor", LangOpts.CPlusPlus)
991            .Case("has_trivial_assign", LangOpts.CPlusPlus)
992            .Case("has_trivial_copy", LangOpts.CPlusPlus)
993            .Case("has_trivial_constructor", LangOpts.CPlusPlus)
994            .Case("has_trivial_destructor", LangOpts.CPlusPlus)
995            .Case("has_virtual_destructor", LangOpts.CPlusPlus)
996            .Case("is_abstract", LangOpts.CPlusPlus)
997            .Case("is_base_of", LangOpts.CPlusPlus)
998            .Case("is_class", LangOpts.CPlusPlus)
999            .Case("is_convertible_to", LangOpts.CPlusPlus)
1000            .Case("is_empty", LangOpts.CPlusPlus)
1001            .Case("is_enum", LangOpts.CPlusPlus)
1002            .Case("is_final", LangOpts.CPlusPlus)
1003            .Case("is_literal", LangOpts.CPlusPlus)
1004            .Case("is_standard_layout", LangOpts.CPlusPlus)
1005            .Case("is_pod", LangOpts.CPlusPlus)
1006            .Case("is_polymorphic", LangOpts.CPlusPlus)
1007            .Case("is_trivial", LangOpts.CPlusPlus)
1008            .Case("is_trivially_assignable", LangOpts.CPlusPlus)
1009            .Case("is_trivially_constructible", LangOpts.CPlusPlus)
1010            .Case("is_trivially_copyable", LangOpts.CPlusPlus)
1011            .Case("is_union", LangOpts.CPlusPlus)
1012            .Case("modules", LangOpts.Modules)
1013            .Case("tls", PP.getTargetInfo().isTLSSupported())
1014            .Case("underlying_type", LangOpts.CPlusPlus)
1015            .Default(false);
1016 }
1017 
1018 /// HasExtension - Return true if we recognize and implement the feature
1019 /// specified by the identifier, either as an extension or a standard language
1020 /// feature.
HasExtension(const Preprocessor & PP,const IdentifierInfo * II)1021 static bool HasExtension(const Preprocessor &PP, const IdentifierInfo *II) {
1022   if (HasFeature(PP, II))
1023     return true;
1024 
1025   // If the use of an extension results in an error diagnostic, extensions are
1026   // effectively unavailable, so just return false here.
1027   if (PP.getDiagnostics().getExtensionHandlingBehavior() ==
1028       DiagnosticsEngine::Ext_Error)
1029     return false;
1030 
1031   const LangOptions &LangOpts = PP.getLangOpts();
1032   StringRef Extension = II->getName();
1033 
1034   // Normalize the extension name, __foo__ becomes foo.
1035   if (Extension.startswith("__") && Extension.endswith("__") &&
1036       Extension.size() >= 4)
1037     Extension = Extension.substr(2, Extension.size() - 4);
1038 
1039   // Because we inherit the feature list from HasFeature, this string switch
1040   // must be less restrictive than HasFeature's.
1041   return llvm::StringSwitch<bool>(Extension)
1042            // C11 features supported by other languages as extensions.
1043            .Case("c_alignas", true)
1044            .Case("c_atomic", true)
1045            .Case("c_generic_selections", true)
1046            .Case("c_static_assert", true)
1047            // C++11 features supported by other languages as extensions.
1048            .Case("cxx_atomic", LangOpts.CPlusPlus)
1049            .Case("cxx_deleted_functions", LangOpts.CPlusPlus)
1050            .Case("cxx_explicit_conversions", LangOpts.CPlusPlus)
1051            .Case("cxx_inline_namespaces", LangOpts.CPlusPlus)
1052            .Case("cxx_local_type_template_args", LangOpts.CPlusPlus)
1053            .Case("cxx_nonstatic_member_init", LangOpts.CPlusPlus)
1054            .Case("cxx_override_control", LangOpts.CPlusPlus)
1055            .Case("cxx_range_for", LangOpts.CPlusPlus)
1056            .Case("cxx_reference_qualified_functions", LangOpts.CPlusPlus)
1057            .Case("cxx_rvalue_references", LangOpts.CPlusPlus)
1058            // C++1y features supported by other languages as extensions.
1059            .Case("cxx_binary_literals", true)
1060            .Default(false);
1061 }
1062 
1063 /// HasAttribute -  Return true if we recognize and implement the attribute
1064 /// specified by the given identifier.
HasAttribute(const IdentifierInfo * II)1065 static bool HasAttribute(const IdentifierInfo *II) {
1066   StringRef Name = II->getName();
1067   // Normalize the attribute name, __foo__ becomes foo.
1068   if (Name.startswith("__") && Name.endswith("__") && Name.size() >= 4)
1069     Name = Name.substr(2, Name.size() - 4);
1070 
1071   // FIXME: Do we need to handle namespaces here?
1072   return llvm::StringSwitch<bool>(Name)
1073 #include "clang/Lex/AttrSpellings.inc"
1074         .Default(false);
1075 }
1076 
1077 /// EvaluateHasIncludeCommon - Process a '__has_include("path")'
1078 /// or '__has_include_next("path")' expression.
1079 /// Returns true if successful.
EvaluateHasIncludeCommon(Token & Tok,IdentifierInfo * II,Preprocessor & PP,const DirectoryLookup * LookupFrom)1080 static bool EvaluateHasIncludeCommon(Token &Tok,
1081                                      IdentifierInfo *II, Preprocessor &PP,
1082                                      const DirectoryLookup *LookupFrom) {
1083   // Save the location of the current token.  If a '(' is later found, use
1084   // that location.  If not, use the end of this location instead.
1085   SourceLocation LParenLoc = Tok.getLocation();
1086 
1087   // These expressions are only allowed within a preprocessor directive.
1088   if (!PP.isParsingIfOrElifDirective()) {
1089     PP.Diag(LParenLoc, diag::err_pp_directive_required) << II->getName();
1090     return false;
1091   }
1092 
1093   // Get '('.
1094   PP.LexNonComment(Tok);
1095 
1096   // Ensure we have a '('.
1097   if (Tok.isNot(tok::l_paren)) {
1098     // No '(', use end of last token.
1099     LParenLoc = PP.getLocForEndOfToken(LParenLoc);
1100     PP.Diag(LParenLoc, diag::err_pp_missing_lparen) << II->getName();
1101     // If the next token looks like a filename or the start of one,
1102     // assume it is and process it as such.
1103     if (!Tok.is(tok::angle_string_literal) && !Tok.is(tok::string_literal) &&
1104         !Tok.is(tok::less))
1105       return false;
1106   } else {
1107     // Save '(' location for possible missing ')' message.
1108     LParenLoc = Tok.getLocation();
1109 
1110     if (PP.getCurrentLexer()) {
1111       // Get the file name.
1112       PP.getCurrentLexer()->LexIncludeFilename(Tok);
1113     } else {
1114       // We're in a macro, so we can't use LexIncludeFilename; just
1115       // grab the next token.
1116       PP.Lex(Tok);
1117     }
1118   }
1119 
1120   // Reserve a buffer to get the spelling.
1121   SmallString<128> FilenameBuffer;
1122   StringRef Filename;
1123   SourceLocation EndLoc;
1124 
1125   switch (Tok.getKind()) {
1126   case tok::eod:
1127     // If the token kind is EOD, the error has already been diagnosed.
1128     return false;
1129 
1130   case tok::angle_string_literal:
1131   case tok::string_literal: {
1132     bool Invalid = false;
1133     Filename = PP.getSpelling(Tok, FilenameBuffer, &Invalid);
1134     if (Invalid)
1135       return false;
1136     break;
1137   }
1138 
1139   case tok::less:
1140     // This could be a <foo/bar.h> file coming from a macro expansion.  In this
1141     // case, glue the tokens together into FilenameBuffer and interpret those.
1142     FilenameBuffer.push_back('<');
1143     if (PP.ConcatenateIncludeName(FilenameBuffer, EndLoc)) {
1144       // Let the caller know a <eod> was found by changing the Token kind.
1145       Tok.setKind(tok::eod);
1146       return false;   // Found <eod> but no ">"?  Diagnostic already emitted.
1147     }
1148     Filename = FilenameBuffer.str();
1149     break;
1150   default:
1151     PP.Diag(Tok.getLocation(), diag::err_pp_expects_filename);
1152     return false;
1153   }
1154 
1155   SourceLocation FilenameLoc = Tok.getLocation();
1156 
1157   // Get ')'.
1158   PP.LexNonComment(Tok);
1159 
1160   // Ensure we have a trailing ).
1161   if (Tok.isNot(tok::r_paren)) {
1162     PP.Diag(PP.getLocForEndOfToken(FilenameLoc), diag::err_pp_missing_rparen)
1163         << II->getName();
1164     PP.Diag(LParenLoc, diag::note_matching) << "(";
1165     return false;
1166   }
1167 
1168   bool isAngled = PP.GetIncludeFilenameSpelling(Tok.getLocation(), Filename);
1169   // If GetIncludeFilenameSpelling set the start ptr to null, there was an
1170   // error.
1171   if (Filename.empty())
1172     return false;
1173 
1174   // Search include directories.
1175   const DirectoryLookup *CurDir;
1176   const FileEntry *File =
1177       PP.LookupFile(FilenameLoc, Filename, isAngled, LookupFrom, CurDir, NULL,
1178                     NULL, NULL);
1179 
1180   // Get the result value.  A result of true means the file exists.
1181   return File != 0;
1182 }
1183 
1184 /// EvaluateHasInclude - Process a '__has_include("path")' expression.
1185 /// Returns true if successful.
EvaluateHasInclude(Token & Tok,IdentifierInfo * II,Preprocessor & PP)1186 static bool EvaluateHasInclude(Token &Tok, IdentifierInfo *II,
1187                                Preprocessor &PP) {
1188   return EvaluateHasIncludeCommon(Tok, II, PP, NULL);
1189 }
1190 
1191 /// EvaluateHasIncludeNext - Process '__has_include_next("path")' expression.
1192 /// Returns true if successful.
EvaluateHasIncludeNext(Token & Tok,IdentifierInfo * II,Preprocessor & PP)1193 static bool EvaluateHasIncludeNext(Token &Tok,
1194                                    IdentifierInfo *II, Preprocessor &PP) {
1195   // __has_include_next is like __has_include, except that we start
1196   // searching after the current found directory.  If we can't do this,
1197   // issue a diagnostic.
1198   const DirectoryLookup *Lookup = PP.GetCurDirLookup();
1199   if (PP.isInPrimaryFile()) {
1200     Lookup = 0;
1201     PP.Diag(Tok, diag::pp_include_next_in_primary);
1202   } else if (Lookup == 0) {
1203     PP.Diag(Tok, diag::pp_include_next_absolute_path);
1204   } else {
1205     // Start looking up in the next directory.
1206     ++Lookup;
1207   }
1208 
1209   return EvaluateHasIncludeCommon(Tok, II, PP, Lookup);
1210 }
1211 
1212 /// \brief Process __building_module(identifier) expression.
1213 /// \returns true if we are building the named module, false otherwise.
EvaluateBuildingModule(Token & Tok,IdentifierInfo * II,Preprocessor & PP)1214 static bool EvaluateBuildingModule(Token &Tok,
1215                                    IdentifierInfo *II, Preprocessor &PP) {
1216   // Get '('.
1217   PP.LexNonComment(Tok);
1218 
1219   // Ensure we have a '('.
1220   if (Tok.isNot(tok::l_paren)) {
1221     PP.Diag(Tok.getLocation(), diag::err_pp_missing_lparen) << II->getName();
1222     return false;
1223   }
1224 
1225   // Save '(' location for possible missing ')' message.
1226   SourceLocation LParenLoc = Tok.getLocation();
1227 
1228   // Get the module name.
1229   PP.LexNonComment(Tok);
1230 
1231   // Ensure that we have an identifier.
1232   if (Tok.isNot(tok::identifier)) {
1233     PP.Diag(Tok.getLocation(), diag::err_expected_id_building_module);
1234     return false;
1235   }
1236 
1237   bool Result
1238     = Tok.getIdentifierInfo()->getName() == PP.getLangOpts().CurrentModule;
1239 
1240   // Get ')'.
1241   PP.LexNonComment(Tok);
1242 
1243   // Ensure we have a trailing ).
1244   if (Tok.isNot(tok::r_paren)) {
1245     PP.Diag(Tok.getLocation(), diag::err_pp_missing_rparen) << II->getName();
1246     PP.Diag(LParenLoc, diag::note_matching) << "(";
1247     return false;
1248   }
1249 
1250   return Result;
1251 }
1252 
1253 /// ExpandBuiltinMacro - If an identifier token is read that is to be expanded
1254 /// as a builtin macro, handle it and return the next token as 'Tok'.
ExpandBuiltinMacro(Token & Tok)1255 void Preprocessor::ExpandBuiltinMacro(Token &Tok) {
1256   // Figure out which token this is.
1257   IdentifierInfo *II = Tok.getIdentifierInfo();
1258   assert(II && "Can't be a macro without id info!");
1259 
1260   // If this is an _Pragma or Microsoft __pragma directive, expand it,
1261   // invoke the pragma handler, then lex the token after it.
1262   if (II == Ident_Pragma)
1263     return Handle_Pragma(Tok);
1264   else if (II == Ident__pragma) // in non-MS mode this is null
1265     return HandleMicrosoft__pragma(Tok);
1266 
1267   ++NumBuiltinMacroExpanded;
1268 
1269   SmallString<128> TmpBuffer;
1270   llvm::raw_svector_ostream OS(TmpBuffer);
1271 
1272   // Set up the return result.
1273   Tok.setIdentifierInfo(0);
1274   Tok.clearFlag(Token::NeedsCleaning);
1275 
1276   if (II == Ident__LINE__) {
1277     // C99 6.10.8: "__LINE__: The presumed line number (within the current
1278     // source file) of the current source line (an integer constant)".  This can
1279     // be affected by #line.
1280     SourceLocation Loc = Tok.getLocation();
1281 
1282     // Advance to the location of the first _, this might not be the first byte
1283     // of the token if it starts with an escaped newline.
1284     Loc = AdvanceToTokenCharacter(Loc, 0);
1285 
1286     // One wrinkle here is that GCC expands __LINE__ to location of the *end* of
1287     // a macro expansion.  This doesn't matter for object-like macros, but
1288     // can matter for a function-like macro that expands to contain __LINE__.
1289     // Skip down through expansion points until we find a file loc for the
1290     // end of the expansion history.
1291     Loc = SourceMgr.getExpansionRange(Loc).second;
1292     PresumedLoc PLoc = SourceMgr.getPresumedLoc(Loc);
1293 
1294     // __LINE__ expands to a simple numeric value.
1295     OS << (PLoc.isValid()? PLoc.getLine() : 1);
1296     Tok.setKind(tok::numeric_constant);
1297   } else if (II == Ident__FILE__ || II == Ident__BASE_FILE__) {
1298     // C99 6.10.8: "__FILE__: The presumed name of the current source file (a
1299     // character string literal)". This can be affected by #line.
1300     PresumedLoc PLoc = SourceMgr.getPresumedLoc(Tok.getLocation());
1301 
1302     // __BASE_FILE__ is a GNU extension that returns the top of the presumed
1303     // #include stack instead of the current file.
1304     if (II == Ident__BASE_FILE__ && PLoc.isValid()) {
1305       SourceLocation NextLoc = PLoc.getIncludeLoc();
1306       while (NextLoc.isValid()) {
1307         PLoc = SourceMgr.getPresumedLoc(NextLoc);
1308         if (PLoc.isInvalid())
1309           break;
1310 
1311         NextLoc = PLoc.getIncludeLoc();
1312       }
1313     }
1314 
1315     // Escape this filename.  Turn '\' -> '\\' '"' -> '\"'
1316     SmallString<128> FN;
1317     if (PLoc.isValid()) {
1318       FN += PLoc.getFilename();
1319       Lexer::Stringify(FN);
1320       OS << '"' << FN.str() << '"';
1321     }
1322     Tok.setKind(tok::string_literal);
1323   } else if (II == Ident__DATE__) {
1324     if (!DATELoc.isValid())
1325       ComputeDATE_TIME(DATELoc, TIMELoc, *this);
1326     Tok.setKind(tok::string_literal);
1327     Tok.setLength(strlen("\"Mmm dd yyyy\""));
1328     Tok.setLocation(SourceMgr.createExpansionLoc(DATELoc, Tok.getLocation(),
1329                                                  Tok.getLocation(),
1330                                                  Tok.getLength()));
1331     return;
1332   } else if (II == Ident__TIME__) {
1333     if (!TIMELoc.isValid())
1334       ComputeDATE_TIME(DATELoc, TIMELoc, *this);
1335     Tok.setKind(tok::string_literal);
1336     Tok.setLength(strlen("\"hh:mm:ss\""));
1337     Tok.setLocation(SourceMgr.createExpansionLoc(TIMELoc, Tok.getLocation(),
1338                                                  Tok.getLocation(),
1339                                                  Tok.getLength()));
1340     return;
1341   } else if (II == Ident__INCLUDE_LEVEL__) {
1342     // Compute the presumed include depth of this token.  This can be affected
1343     // by GNU line markers.
1344     unsigned Depth = 0;
1345 
1346     PresumedLoc PLoc = SourceMgr.getPresumedLoc(Tok.getLocation());
1347     if (PLoc.isValid()) {
1348       PLoc = SourceMgr.getPresumedLoc(PLoc.getIncludeLoc());
1349       for (; PLoc.isValid(); ++Depth)
1350         PLoc = SourceMgr.getPresumedLoc(PLoc.getIncludeLoc());
1351     }
1352 
1353     // __INCLUDE_LEVEL__ expands to a simple numeric value.
1354     OS << Depth;
1355     Tok.setKind(tok::numeric_constant);
1356   } else if (II == Ident__TIMESTAMP__) {
1357     // MSVC, ICC, GCC, VisualAge C++ extension.  The generated string should be
1358     // of the form "Ddd Mmm dd hh::mm::ss yyyy", which is returned by asctime.
1359 
1360     // Get the file that we are lexing out of.  If we're currently lexing from
1361     // a macro, dig into the include stack.
1362     const FileEntry *CurFile = 0;
1363     PreprocessorLexer *TheLexer = getCurrentFileLexer();
1364 
1365     if (TheLexer)
1366       CurFile = SourceMgr.getFileEntryForID(TheLexer->getFileID());
1367 
1368     const char *Result;
1369     if (CurFile) {
1370       time_t TT = CurFile->getModificationTime();
1371       struct tm *TM = localtime(&TT);
1372       Result = asctime(TM);
1373     } else {
1374       Result = "??? ??? ?? ??:??:?? ????\n";
1375     }
1376     // Surround the string with " and strip the trailing newline.
1377     OS << '"' << StringRef(Result, strlen(Result)-1) << '"';
1378     Tok.setKind(tok::string_literal);
1379   } else if (II == Ident__COUNTER__) {
1380     // __COUNTER__ expands to a simple numeric value.
1381     OS << CounterValue++;
1382     Tok.setKind(tok::numeric_constant);
1383   } else if (II == Ident__has_feature   ||
1384              II == Ident__has_extension ||
1385              II == Ident__has_builtin   ||
1386              II == Ident__has_attribute) {
1387     // The argument to these builtins should be a parenthesized identifier.
1388     SourceLocation StartLoc = Tok.getLocation();
1389 
1390     bool IsValid = false;
1391     IdentifierInfo *FeatureII = 0;
1392 
1393     // Read the '('.
1394     LexUnexpandedToken(Tok);
1395     if (Tok.is(tok::l_paren)) {
1396       // Read the identifier
1397       LexUnexpandedToken(Tok);
1398       if ((FeatureII = Tok.getIdentifierInfo())) {
1399         // Read the ')'.
1400         LexUnexpandedToken(Tok);
1401         if (Tok.is(tok::r_paren))
1402           IsValid = true;
1403       }
1404     }
1405 
1406     bool Value = false;
1407     if (!IsValid)
1408       Diag(StartLoc, diag::err_feature_check_malformed);
1409     else if (II == Ident__has_builtin) {
1410       // Check for a builtin is trivial.
1411       Value = FeatureII->getBuiltinID() != 0;
1412     } else if (II == Ident__has_attribute)
1413       Value = HasAttribute(FeatureII);
1414     else if (II == Ident__has_extension)
1415       Value = HasExtension(*this, FeatureII);
1416     else {
1417       assert(II == Ident__has_feature && "Must be feature check");
1418       Value = HasFeature(*this, FeatureII);
1419     }
1420 
1421     OS << (int)Value;
1422     if (IsValid)
1423       Tok.setKind(tok::numeric_constant);
1424   } else if (II == Ident__has_include ||
1425              II == Ident__has_include_next) {
1426     // The argument to these two builtins should be a parenthesized
1427     // file name string literal using angle brackets (<>) or
1428     // double-quotes ("").
1429     bool Value;
1430     if (II == Ident__has_include)
1431       Value = EvaluateHasInclude(Tok, II, *this);
1432     else
1433       Value = EvaluateHasIncludeNext(Tok, II, *this);
1434     OS << (int)Value;
1435     if (Tok.is(tok::r_paren))
1436       Tok.setKind(tok::numeric_constant);
1437   } else if (II == Ident__has_warning) {
1438     // The argument should be a parenthesized string literal.
1439     // The argument to these builtins should be a parenthesized identifier.
1440     SourceLocation StartLoc = Tok.getLocation();
1441     bool IsValid = false;
1442     bool Value = false;
1443     // Read the '('.
1444     LexUnexpandedToken(Tok);
1445     do {
1446       if (Tok.isNot(tok::l_paren)) {
1447         Diag(StartLoc, diag::err_warning_check_malformed);
1448         break;
1449       }
1450 
1451       LexUnexpandedToken(Tok);
1452       std::string WarningName;
1453       SourceLocation StrStartLoc = Tok.getLocation();
1454       if (!FinishLexStringLiteral(Tok, WarningName, "'__has_warning'",
1455                                   /*MacroExpansion=*/false)) {
1456         // Eat tokens until ')'.
1457         while (Tok.isNot(tok::r_paren) && Tok.isNot(tok::eod) &&
1458                Tok.isNot(tok::eof))
1459           LexUnexpandedToken(Tok);
1460         break;
1461       }
1462 
1463       // Is the end a ')'?
1464       if (!(IsValid = Tok.is(tok::r_paren))) {
1465         Diag(StartLoc, diag::err_warning_check_malformed);
1466         break;
1467       }
1468 
1469       if (WarningName.size() < 3 || WarningName[0] != '-' ||
1470           WarningName[1] != 'W') {
1471         Diag(StrStartLoc, diag::warn_has_warning_invalid_option);
1472         break;
1473       }
1474 
1475       // Finally, check if the warning flags maps to a diagnostic group.
1476       // We construct a SmallVector here to talk to getDiagnosticIDs().
1477       // Although we don't use the result, this isn't a hot path, and not
1478       // worth special casing.
1479       SmallVector<diag::kind, 10> Diags;
1480       Value = !getDiagnostics().getDiagnosticIDs()->
1481         getDiagnosticsInGroup(WarningName.substr(2), Diags);
1482     } while (false);
1483 
1484     OS << (int)Value;
1485     if (IsValid)
1486       Tok.setKind(tok::numeric_constant);
1487   } else if (II == Ident__building_module) {
1488     // The argument to this builtin should be an identifier. The
1489     // builtin evaluates to 1 when that identifier names the module we are
1490     // currently building.
1491     OS << (int)EvaluateBuildingModule(Tok, II, *this);
1492     Tok.setKind(tok::numeric_constant);
1493   } else if (II == Ident__MODULE__) {
1494     // The current module as an identifier.
1495     OS << getLangOpts().CurrentModule;
1496     IdentifierInfo *ModuleII = getIdentifierInfo(getLangOpts().CurrentModule);
1497     Tok.setIdentifierInfo(ModuleII);
1498     Tok.setKind(ModuleII->getTokenID());
1499   } else {
1500     llvm_unreachable("Unknown identifier!");
1501   }
1502   CreateString(OS.str(), Tok, Tok.getLocation(), Tok.getLocation());
1503 }
1504 
markMacroAsUsed(MacroInfo * MI)1505 void Preprocessor::markMacroAsUsed(MacroInfo *MI) {
1506   // If the 'used' status changed, and the macro requires 'unused' warning,
1507   // remove its SourceLocation from the warn-for-unused-macro locations.
1508   if (MI->isWarnIfUnused() && !MI->isUsed())
1509     WarnUnusedMacroLocs.erase(MI->getDefinitionLoc());
1510   MI->setIsUsed(true);
1511 }
1512