1 //===--- MacroExpansion.cpp - Top level Macro Expansion -------------------===//
2 //
3 // The LLVM Compiler Infrastructure
4 //
5 // This file is distributed under the University of Illinois Open Source
6 // License. See LICENSE.TXT for details.
7 //
8 //===----------------------------------------------------------------------===//
9 //
10 // This file implements the top level handling of macro expasion for the
11 // preprocessor.
12 //
13 //===----------------------------------------------------------------------===//
14
15 #include "clang/Lex/Preprocessor.h"
16 #include "clang/Lex/MacroArgs.h"
17 #include "clang/Basic/FileManager.h"
18 #include "clang/Basic/SourceManager.h"
19 #include "clang/Basic/TargetInfo.h"
20 #include "clang/Lex/CodeCompletionHandler.h"
21 #include "clang/Lex/ExternalPreprocessorSource.h"
22 #include "clang/Lex/LexDiagnostic.h"
23 #include "clang/Lex/MacroInfo.h"
24 #include "llvm/ADT/STLExtras.h"
25 #include "llvm/ADT/SmallString.h"
26 #include "llvm/ADT/StringSwitch.h"
27 #include "llvm/Config/llvm-config.h"
28 #include "llvm/Support/ErrorHandling.h"
29 #include "llvm/Support/Format.h"
30 #include "llvm/Support/raw_ostream.h"
31 #include <cstdio>
32 #include <ctime>
33 using namespace clang;
34
35 MacroDirective *
getMacroDirectiveHistory(const IdentifierInfo * II) const36 Preprocessor::getMacroDirectiveHistory(const IdentifierInfo *II) const {
37 assert(II->hadMacroDefinition() && "Identifier has not been not a macro!");
38
39 macro_iterator Pos = Macros.find(II);
40 assert(Pos != Macros.end() && "Identifier macro info is missing!");
41 return Pos->second;
42 }
43
appendMacroDirective(IdentifierInfo * II,MacroDirective * MD)44 void Preprocessor::appendMacroDirective(IdentifierInfo *II, MacroDirective *MD){
45 assert(MD && "MacroDirective should be non-zero!");
46 assert(!MD->getPrevious() && "Already attached to a MacroDirective history.");
47
48 MacroDirective *&StoredMD = Macros[II];
49 MD->setPrevious(StoredMD);
50 StoredMD = MD;
51 II->setHasMacroDefinition(MD->isDefined());
52 bool isImportedMacro = isa<DefMacroDirective>(MD) &&
53 cast<DefMacroDirective>(MD)->isImported();
54 if (II->isFromAST() && !isImportedMacro)
55 II->setChangedSinceDeserialization();
56 }
57
setLoadedMacroDirective(IdentifierInfo * II,MacroDirective * MD)58 void Preprocessor::setLoadedMacroDirective(IdentifierInfo *II,
59 MacroDirective *MD) {
60 assert(II && MD);
61 MacroDirective *&StoredMD = Macros[II];
62 assert(!StoredMD &&
63 "the macro history was modified before initializing it from a pch");
64 StoredMD = MD;
65 // Setup the identifier as having associated macro history.
66 II->setHasMacroDefinition(true);
67 if (!MD->isDefined())
68 II->setHasMacroDefinition(false);
69 }
70
71 /// RegisterBuiltinMacro - Register the specified identifier in the identifier
72 /// table and mark it as a builtin macro to be expanded.
RegisterBuiltinMacro(Preprocessor & PP,const char * Name)73 static IdentifierInfo *RegisterBuiltinMacro(Preprocessor &PP, const char *Name){
74 // Get the identifier.
75 IdentifierInfo *Id = PP.getIdentifierInfo(Name);
76
77 // Mark it as being a macro that is builtin.
78 MacroInfo *MI = PP.AllocateMacroInfo(SourceLocation());
79 MI->setIsBuiltinMacro();
80 PP.appendDefMacroDirective(Id, MI);
81 return Id;
82 }
83
84
85 /// RegisterBuiltinMacros - Register builtin macros, such as __LINE__ with the
86 /// identifier table.
RegisterBuiltinMacros()87 void Preprocessor::RegisterBuiltinMacros() {
88 Ident__LINE__ = RegisterBuiltinMacro(*this, "__LINE__");
89 Ident__FILE__ = RegisterBuiltinMacro(*this, "__FILE__");
90 Ident__DATE__ = RegisterBuiltinMacro(*this, "__DATE__");
91 Ident__TIME__ = RegisterBuiltinMacro(*this, "__TIME__");
92 Ident__COUNTER__ = RegisterBuiltinMacro(*this, "__COUNTER__");
93 Ident_Pragma = RegisterBuiltinMacro(*this, "_Pragma");
94
95 // GCC Extensions.
96 Ident__BASE_FILE__ = RegisterBuiltinMacro(*this, "__BASE_FILE__");
97 Ident__INCLUDE_LEVEL__ = RegisterBuiltinMacro(*this, "__INCLUDE_LEVEL__");
98 Ident__TIMESTAMP__ = RegisterBuiltinMacro(*this, "__TIMESTAMP__");
99
100 // Clang Extensions.
101 Ident__has_feature = RegisterBuiltinMacro(*this, "__has_feature");
102 Ident__has_extension = RegisterBuiltinMacro(*this, "__has_extension");
103 Ident__has_builtin = RegisterBuiltinMacro(*this, "__has_builtin");
104 Ident__has_attribute = RegisterBuiltinMacro(*this, "__has_attribute");
105 Ident__has_include = RegisterBuiltinMacro(*this, "__has_include");
106 Ident__has_include_next = RegisterBuiltinMacro(*this, "__has_include_next");
107 Ident__has_warning = RegisterBuiltinMacro(*this, "__has_warning");
108
109 // Modules.
110 if (LangOpts.Modules) {
111 Ident__building_module = RegisterBuiltinMacro(*this, "__building_module");
112
113 // __MODULE__
114 if (!LangOpts.CurrentModule.empty())
115 Ident__MODULE__ = RegisterBuiltinMacro(*this, "__MODULE__");
116 else
117 Ident__MODULE__ = 0;
118 } else {
119 Ident__building_module = 0;
120 Ident__MODULE__ = 0;
121 }
122
123 // Microsoft Extensions.
124 if (LangOpts.MicrosoftExt)
125 Ident__pragma = RegisterBuiltinMacro(*this, "__pragma");
126 else
127 Ident__pragma = 0;
128 }
129
130 /// isTrivialSingleTokenExpansion - Return true if MI, which has a single token
131 /// in its expansion, currently expands to that token literally.
isTrivialSingleTokenExpansion(const MacroInfo * MI,const IdentifierInfo * MacroIdent,Preprocessor & PP)132 static bool isTrivialSingleTokenExpansion(const MacroInfo *MI,
133 const IdentifierInfo *MacroIdent,
134 Preprocessor &PP) {
135 IdentifierInfo *II = MI->getReplacementToken(0).getIdentifierInfo();
136
137 // If the token isn't an identifier, it's always literally expanded.
138 if (II == 0) return true;
139
140 // If the information about this identifier is out of date, update it from
141 // the external source.
142 if (II->isOutOfDate())
143 PP.getExternalSource()->updateOutOfDateIdentifier(*II);
144
145 // If the identifier is a macro, and if that macro is enabled, it may be
146 // expanded so it's not a trivial expansion.
147 if (II->hasMacroDefinition() && PP.getMacroInfo(II)->isEnabled() &&
148 // Fast expanding "#define X X" is ok, because X would be disabled.
149 II != MacroIdent)
150 return false;
151
152 // If this is an object-like macro invocation, it is safe to trivially expand
153 // it.
154 if (MI->isObjectLike()) return true;
155
156 // If this is a function-like macro invocation, it's safe to trivially expand
157 // as long as the identifier is not a macro argument.
158 for (MacroInfo::arg_iterator I = MI->arg_begin(), E = MI->arg_end();
159 I != E; ++I)
160 if (*I == II)
161 return false; // Identifier is a macro argument.
162
163 return true;
164 }
165
166
167 /// isNextPPTokenLParen - Determine whether the next preprocessor token to be
168 /// lexed is a '('. If so, consume the token and return true, if not, this
169 /// method should have no observable side-effect on the lexed tokens.
isNextPPTokenLParen()170 bool Preprocessor::isNextPPTokenLParen() {
171 // Do some quick tests for rejection cases.
172 unsigned Val;
173 if (CurLexer)
174 Val = CurLexer->isNextPPTokenLParen();
175 else if (CurPTHLexer)
176 Val = CurPTHLexer->isNextPPTokenLParen();
177 else
178 Val = CurTokenLexer->isNextTokenLParen();
179
180 if (Val == 2) {
181 // We have run off the end. If it's a source file we don't
182 // examine enclosing ones (C99 5.1.1.2p4). Otherwise walk up the
183 // macro stack.
184 if (CurPPLexer)
185 return false;
186 for (unsigned i = IncludeMacroStack.size(); i != 0; --i) {
187 IncludeStackInfo &Entry = IncludeMacroStack[i-1];
188 if (Entry.TheLexer)
189 Val = Entry.TheLexer->isNextPPTokenLParen();
190 else if (Entry.ThePTHLexer)
191 Val = Entry.ThePTHLexer->isNextPPTokenLParen();
192 else
193 Val = Entry.TheTokenLexer->isNextTokenLParen();
194
195 if (Val != 2)
196 break;
197
198 // Ran off the end of a source file?
199 if (Entry.ThePPLexer)
200 return false;
201 }
202 }
203
204 // Okay, if we know that the token is a '(', lex it and return. Otherwise we
205 // have found something that isn't a '(' or we found the end of the
206 // translation unit. In either case, return false.
207 return Val == 1;
208 }
209
210 /// HandleMacroExpandedIdentifier - If an identifier token is read that is to be
211 /// expanded as a macro, handle it and return the next token as 'Identifier'.
HandleMacroExpandedIdentifier(Token & Identifier,MacroDirective * MD)212 bool Preprocessor::HandleMacroExpandedIdentifier(Token &Identifier,
213 MacroDirective *MD) {
214 MacroDirective::DefInfo Def = MD->getDefinition();
215 assert(Def.isValid());
216 MacroInfo *MI = Def.getMacroInfo();
217
218 // If this is a macro expansion in the "#if !defined(x)" line for the file,
219 // then the macro could expand to different things in other contexts, we need
220 // to disable the optimization in this case.
221 if (CurPPLexer) CurPPLexer->MIOpt.ExpandedMacro();
222
223 // If this is a builtin macro, like __LINE__ or _Pragma, handle it specially.
224 if (MI->isBuiltinMacro()) {
225 if (Callbacks) Callbacks->MacroExpands(Identifier, MD,
226 Identifier.getLocation(),/*Args=*/0);
227 ExpandBuiltinMacro(Identifier);
228 return false;
229 }
230
231 /// Args - If this is a function-like macro expansion, this contains,
232 /// for each macro argument, the list of tokens that were provided to the
233 /// invocation.
234 MacroArgs *Args = 0;
235
236 // Remember where the end of the expansion occurred. For an object-like
237 // macro, this is the identifier. For a function-like macro, this is the ')'.
238 SourceLocation ExpansionEnd = Identifier.getLocation();
239
240 // If this is a function-like macro, read the arguments.
241 if (MI->isFunctionLike()) {
242 // C99 6.10.3p10: If the preprocessing token immediately after the macro
243 // name isn't a '(', this macro should not be expanded.
244 if (!isNextPPTokenLParen())
245 return true;
246
247 // Remember that we are now parsing the arguments to a macro invocation.
248 // Preprocessor directives used inside macro arguments are not portable, and
249 // this enables the warning.
250 InMacroArgs = true;
251 Args = ReadFunctionLikeMacroArgs(Identifier, MI, ExpansionEnd);
252
253 // Finished parsing args.
254 InMacroArgs = false;
255
256 // If there was an error parsing the arguments, bail out.
257 if (Args == 0) return false;
258
259 ++NumFnMacroExpanded;
260 } else {
261 ++NumMacroExpanded;
262 }
263
264 // Notice that this macro has been used.
265 markMacroAsUsed(MI);
266
267 // Remember where the token is expanded.
268 SourceLocation ExpandLoc = Identifier.getLocation();
269 SourceRange ExpansionRange(ExpandLoc, ExpansionEnd);
270
271 if (Callbacks) {
272 if (InMacroArgs) {
273 // We can have macro expansion inside a conditional directive while
274 // reading the function macro arguments. To ensure, in that case, that
275 // MacroExpands callbacks still happen in source order, queue this
276 // callback to have it happen after the function macro callback.
277 DelayedMacroExpandsCallbacks.push_back(
278 MacroExpandsInfo(Identifier, MD, ExpansionRange));
279 } else {
280 Callbacks->MacroExpands(Identifier, MD, ExpansionRange, Args);
281 if (!DelayedMacroExpandsCallbacks.empty()) {
282 for (unsigned i=0, e = DelayedMacroExpandsCallbacks.size(); i!=e; ++i) {
283 MacroExpandsInfo &Info = DelayedMacroExpandsCallbacks[i];
284 // FIXME: We lose macro args info with delayed callback.
285 Callbacks->MacroExpands(Info.Tok, Info.MD, Info.Range, /*Args=*/0);
286 }
287 DelayedMacroExpandsCallbacks.clear();
288 }
289 }
290 }
291
292 // If the macro definition is ambiguous, complain.
293 if (Def.getDirective()->isAmbiguous()) {
294 Diag(Identifier, diag::warn_pp_ambiguous_macro)
295 << Identifier.getIdentifierInfo();
296 Diag(MI->getDefinitionLoc(), diag::note_pp_ambiguous_macro_chosen)
297 << Identifier.getIdentifierInfo();
298 for (MacroDirective::DefInfo PrevDef = Def.getPreviousDefinition();
299 PrevDef && !PrevDef.isUndefined();
300 PrevDef = PrevDef.getPreviousDefinition()) {
301 if (PrevDef.getDirective()->isAmbiguous()) {
302 Diag(PrevDef.getMacroInfo()->getDefinitionLoc(),
303 diag::note_pp_ambiguous_macro_other)
304 << Identifier.getIdentifierInfo();
305 }
306 }
307 }
308
309 // If we started lexing a macro, enter the macro expansion body.
310
311 // If this macro expands to no tokens, don't bother to push it onto the
312 // expansion stack, only to take it right back off.
313 if (MI->getNumTokens() == 0) {
314 // No need for arg info.
315 if (Args) Args->destroy(*this);
316
317 // Ignore this macro use, just return the next token in the current
318 // buffer.
319 bool HadLeadingSpace = Identifier.hasLeadingSpace();
320 bool IsAtStartOfLine = Identifier.isAtStartOfLine();
321
322 Lex(Identifier);
323
324 // If the identifier isn't on some OTHER line, inherit the leading
325 // whitespace/first-on-a-line property of this token. This handles
326 // stuff like "! XX," -> "! ," and " XX," -> " ,", when XX is
327 // empty.
328 if (!Identifier.isAtStartOfLine()) {
329 if (IsAtStartOfLine) Identifier.setFlag(Token::StartOfLine);
330 if (HadLeadingSpace) Identifier.setFlag(Token::LeadingSpace);
331 }
332 Identifier.setFlag(Token::LeadingEmptyMacro);
333 ++NumFastMacroExpanded;
334 return false;
335
336 } else if (MI->getNumTokens() == 1 &&
337 isTrivialSingleTokenExpansion(MI, Identifier.getIdentifierInfo(),
338 *this)) {
339 // Otherwise, if this macro expands into a single trivially-expanded
340 // token: expand it now. This handles common cases like
341 // "#define VAL 42".
342
343 // No need for arg info.
344 if (Args) Args->destroy(*this);
345
346 // Propagate the isAtStartOfLine/hasLeadingSpace markers of the macro
347 // identifier to the expanded token.
348 bool isAtStartOfLine = Identifier.isAtStartOfLine();
349 bool hasLeadingSpace = Identifier.hasLeadingSpace();
350
351 // Replace the result token.
352 Identifier = MI->getReplacementToken(0);
353
354 // Restore the StartOfLine/LeadingSpace markers.
355 Identifier.setFlagValue(Token::StartOfLine , isAtStartOfLine);
356 Identifier.setFlagValue(Token::LeadingSpace, hasLeadingSpace);
357
358 // Update the tokens location to include both its expansion and physical
359 // locations.
360 SourceLocation Loc =
361 SourceMgr.createExpansionLoc(Identifier.getLocation(), ExpandLoc,
362 ExpansionEnd,Identifier.getLength());
363 Identifier.setLocation(Loc);
364
365 // If this is a disabled macro or #define X X, we must mark the result as
366 // unexpandable.
367 if (IdentifierInfo *NewII = Identifier.getIdentifierInfo()) {
368 if (MacroInfo *NewMI = getMacroInfo(NewII))
369 if (!NewMI->isEnabled() || NewMI == MI) {
370 Identifier.setFlag(Token::DisableExpand);
371 // Don't warn for "#define X X" like "#define bool bool" from
372 // stdbool.h.
373 if (NewMI != MI || MI->isFunctionLike())
374 Diag(Identifier, diag::pp_disabled_macro_expansion);
375 }
376 }
377
378 // Since this is not an identifier token, it can't be macro expanded, so
379 // we're done.
380 ++NumFastMacroExpanded;
381 return false;
382 }
383
384 // Start expanding the macro.
385 EnterMacro(Identifier, ExpansionEnd, MI, Args);
386
387 // Now that the macro is at the top of the include stack, ask the
388 // preprocessor to read the next token from it.
389 Lex(Identifier);
390 return false;
391 }
392
393 enum Bracket {
394 Brace,
395 Paren
396 };
397
398 /// CheckMatchedBrackets - Returns true if the braces and parentheses in the
399 /// token vector are properly nested.
CheckMatchedBrackets(const SmallVectorImpl<Token> & Tokens)400 static bool CheckMatchedBrackets(const SmallVectorImpl<Token> &Tokens) {
401 SmallVector<Bracket, 8> Brackets;
402 for (SmallVectorImpl<Token>::const_iterator I = Tokens.begin(),
403 E = Tokens.end();
404 I != E; ++I) {
405 if (I->is(tok::l_paren)) {
406 Brackets.push_back(Paren);
407 } else if (I->is(tok::r_paren)) {
408 if (Brackets.empty() || Brackets.back() == Brace)
409 return false;
410 Brackets.pop_back();
411 } else if (I->is(tok::l_brace)) {
412 Brackets.push_back(Brace);
413 } else if (I->is(tok::r_brace)) {
414 if (Brackets.empty() || Brackets.back() == Paren)
415 return false;
416 Brackets.pop_back();
417 }
418 }
419 if (!Brackets.empty())
420 return false;
421 return true;
422 }
423
424 /// GenerateNewArgTokens - Returns true if OldTokens can be converted to a new
425 /// vector of tokens in NewTokens. The new number of arguments will be placed
426 /// in NumArgs and the ranges which need to surrounded in parentheses will be
427 /// in ParenHints.
428 /// Returns false if the token stream cannot be changed. If this is because
429 /// of an initializer list starting a macro argument, the range of those
430 /// initializer lists will be place in InitLists.
GenerateNewArgTokens(Preprocessor & PP,SmallVectorImpl<Token> & OldTokens,SmallVectorImpl<Token> & NewTokens,unsigned & NumArgs,SmallVectorImpl<SourceRange> & ParenHints,SmallVectorImpl<SourceRange> & InitLists)431 static bool GenerateNewArgTokens(Preprocessor &PP,
432 SmallVectorImpl<Token> &OldTokens,
433 SmallVectorImpl<Token> &NewTokens,
434 unsigned &NumArgs,
435 SmallVectorImpl<SourceRange> &ParenHints,
436 SmallVectorImpl<SourceRange> &InitLists) {
437 if (!CheckMatchedBrackets(OldTokens))
438 return false;
439
440 // Once it is known that the brackets are matched, only a simple count of the
441 // braces is needed.
442 unsigned Braces = 0;
443
444 // First token of a new macro argument.
445 SmallVectorImpl<Token>::iterator ArgStartIterator = OldTokens.begin();
446
447 // First closing brace in a new macro argument. Used to generate
448 // SourceRanges for InitLists.
449 SmallVectorImpl<Token>::iterator ClosingBrace = OldTokens.end();
450 NumArgs = 0;
451 Token TempToken;
452 // Set to true when a macro separator token is found inside a braced list.
453 // If true, the fixed argument spans multiple old arguments and ParenHints
454 // will be updated.
455 bool FoundSeparatorToken = false;
456 for (SmallVectorImpl<Token>::iterator I = OldTokens.begin(),
457 E = OldTokens.end();
458 I != E; ++I) {
459 if (I->is(tok::l_brace)) {
460 ++Braces;
461 } else if (I->is(tok::r_brace)) {
462 --Braces;
463 if (Braces == 0 && ClosingBrace == E && FoundSeparatorToken)
464 ClosingBrace = I;
465 } else if (I->is(tok::eof)) {
466 // EOF token is used to separate macro arguments
467 if (Braces != 0) {
468 // Assume comma separator is actually braced list separator and change
469 // it back to a comma.
470 FoundSeparatorToken = true;
471 I->setKind(tok::comma);
472 I->setLength(1);
473 } else { // Braces == 0
474 // Separator token still separates arguments.
475 ++NumArgs;
476
477 // If the argument starts with a brace, it can't be fixed with
478 // parentheses. A different diagnostic will be given.
479 if (FoundSeparatorToken && ArgStartIterator->is(tok::l_brace)) {
480 InitLists.push_back(
481 SourceRange(ArgStartIterator->getLocation(),
482 PP.getLocForEndOfToken(ClosingBrace->getLocation())));
483 ClosingBrace = E;
484 }
485
486 // Add left paren
487 if (FoundSeparatorToken) {
488 TempToken.startToken();
489 TempToken.setKind(tok::l_paren);
490 TempToken.setLocation(ArgStartIterator->getLocation());
491 TempToken.setLength(0);
492 NewTokens.push_back(TempToken);
493 }
494
495 // Copy over argument tokens
496 NewTokens.insert(NewTokens.end(), ArgStartIterator, I);
497
498 // Add right paren and store the paren locations in ParenHints
499 if (FoundSeparatorToken) {
500 SourceLocation Loc = PP.getLocForEndOfToken((I - 1)->getLocation());
501 TempToken.startToken();
502 TempToken.setKind(tok::r_paren);
503 TempToken.setLocation(Loc);
504 TempToken.setLength(0);
505 NewTokens.push_back(TempToken);
506 ParenHints.push_back(SourceRange(ArgStartIterator->getLocation(),
507 Loc));
508 }
509
510 // Copy separator token
511 NewTokens.push_back(*I);
512
513 // Reset values
514 ArgStartIterator = I + 1;
515 FoundSeparatorToken = false;
516 }
517 }
518 }
519
520 return !ParenHints.empty() && InitLists.empty();
521 }
522
523 /// ReadFunctionLikeMacroArgs - After reading "MACRO" and knowing that the next
524 /// token is the '(' of the macro, this method is invoked to read all of the
525 /// actual arguments specified for the macro invocation. This returns null on
526 /// error.
ReadFunctionLikeMacroArgs(Token & MacroName,MacroInfo * MI,SourceLocation & MacroEnd)527 MacroArgs *Preprocessor::ReadFunctionLikeMacroArgs(Token &MacroName,
528 MacroInfo *MI,
529 SourceLocation &MacroEnd) {
530 // The number of fixed arguments to parse.
531 unsigned NumFixedArgsLeft = MI->getNumArgs();
532 bool isVariadic = MI->isVariadic();
533
534 // Outer loop, while there are more arguments, keep reading them.
535 Token Tok;
536
537 // Read arguments as unexpanded tokens. This avoids issues, e.g., where
538 // an argument value in a macro could expand to ',' or '(' or ')'.
539 LexUnexpandedToken(Tok);
540 assert(Tok.is(tok::l_paren) && "Error computing l-paren-ness?");
541
542 // ArgTokens - Build up a list of tokens that make up each argument. Each
543 // argument is separated by an EOF token. Use a SmallVector so we can avoid
544 // heap allocations in the common case.
545 SmallVector<Token, 64> ArgTokens;
546 bool ContainsCodeCompletionTok = false;
547
548 SourceLocation TooManyArgsLoc;
549
550 unsigned NumActuals = 0;
551 while (Tok.isNot(tok::r_paren)) {
552 if (ContainsCodeCompletionTok && (Tok.is(tok::eof) || Tok.is(tok::eod)))
553 break;
554
555 assert((Tok.is(tok::l_paren) || Tok.is(tok::comma)) &&
556 "only expect argument separators here");
557
558 unsigned ArgTokenStart = ArgTokens.size();
559 SourceLocation ArgStartLoc = Tok.getLocation();
560
561 // C99 6.10.3p11: Keep track of the number of l_parens we have seen. Note
562 // that we already consumed the first one.
563 unsigned NumParens = 0;
564
565 while (1) {
566 // Read arguments as unexpanded tokens. This avoids issues, e.g., where
567 // an argument value in a macro could expand to ',' or '(' or ')'.
568 LexUnexpandedToken(Tok);
569
570 if (Tok.is(tok::eof) || Tok.is(tok::eod)) { // "#if f(<eof>" & "#if f(\n"
571 if (!ContainsCodeCompletionTok) {
572 Diag(MacroName, diag::err_unterm_macro_invoc);
573 Diag(MI->getDefinitionLoc(), diag::note_macro_here)
574 << MacroName.getIdentifierInfo();
575 // Do not lose the EOF/EOD. Return it to the client.
576 MacroName = Tok;
577 return 0;
578 } else {
579 // Do not lose the EOF/EOD.
580 Token *Toks = new Token[1];
581 Toks[0] = Tok;
582 EnterTokenStream(Toks, 1, true, true);
583 break;
584 }
585 } else if (Tok.is(tok::r_paren)) {
586 // If we found the ) token, the macro arg list is done.
587 if (NumParens-- == 0) {
588 MacroEnd = Tok.getLocation();
589 break;
590 }
591 } else if (Tok.is(tok::l_paren)) {
592 ++NumParens;
593 } else if (Tok.is(tok::comma) && NumParens == 0 &&
594 !(Tok.getFlags() & Token::IgnoredComma)) {
595 // In Microsoft-compatibility mode, single commas from nested macro
596 // expansions should not be considered as argument separators. We test
597 // for this with the IgnoredComma token flag above.
598
599 // Comma ends this argument if there are more fixed arguments expected.
600 // However, if this is a variadic macro, and this is part of the
601 // variadic part, then the comma is just an argument token.
602 if (!isVariadic) break;
603 if (NumFixedArgsLeft > 1)
604 break;
605 } else if (Tok.is(tok::comment) && !KeepMacroComments) {
606 // If this is a comment token in the argument list and we're just in
607 // -C mode (not -CC mode), discard the comment.
608 continue;
609 } else if (Tok.getIdentifierInfo() != 0) {
610 // Reading macro arguments can cause macros that we are currently
611 // expanding from to be popped off the expansion stack. Doing so causes
612 // them to be reenabled for expansion. Here we record whether any
613 // identifiers we lex as macro arguments correspond to disabled macros.
614 // If so, we mark the token as noexpand. This is a subtle aspect of
615 // C99 6.10.3.4p2.
616 if (MacroInfo *MI = getMacroInfo(Tok.getIdentifierInfo()))
617 if (!MI->isEnabled())
618 Tok.setFlag(Token::DisableExpand);
619 } else if (Tok.is(tok::code_completion)) {
620 ContainsCodeCompletionTok = true;
621 if (CodeComplete)
622 CodeComplete->CodeCompleteMacroArgument(MacroName.getIdentifierInfo(),
623 MI, NumActuals);
624 // Don't mark that we reached the code-completion point because the
625 // parser is going to handle the token and there will be another
626 // code-completion callback.
627 }
628
629 ArgTokens.push_back(Tok);
630 }
631
632 // If this was an empty argument list foo(), don't add this as an empty
633 // argument.
634 if (ArgTokens.empty() && Tok.getKind() == tok::r_paren)
635 break;
636
637 // If this is not a variadic macro, and too many args were specified, emit
638 // an error.
639 if (!isVariadic && NumFixedArgsLeft == 0 && TooManyArgsLoc.isInvalid()) {
640 if (ArgTokens.size() != ArgTokenStart)
641 TooManyArgsLoc = ArgTokens[ArgTokenStart].getLocation();
642 else
643 TooManyArgsLoc = ArgStartLoc;
644 }
645
646 // Empty arguments are standard in C99 and C++0x, and are supported as an
647 // extension in other modes.
648 if (ArgTokens.size() == ArgTokenStart && !LangOpts.C99)
649 Diag(Tok, LangOpts.CPlusPlus11 ?
650 diag::warn_cxx98_compat_empty_fnmacro_arg :
651 diag::ext_empty_fnmacro_arg);
652
653 // Add a marker EOF token to the end of the token list for this argument.
654 Token EOFTok;
655 EOFTok.startToken();
656 EOFTok.setKind(tok::eof);
657 EOFTok.setLocation(Tok.getLocation());
658 EOFTok.setLength(0);
659 ArgTokens.push_back(EOFTok);
660 ++NumActuals;
661 if (!ContainsCodeCompletionTok && NumFixedArgsLeft != 0)
662 --NumFixedArgsLeft;
663 }
664
665 // Okay, we either found the r_paren. Check to see if we parsed too few
666 // arguments.
667 unsigned MinArgsExpected = MI->getNumArgs();
668
669 // If this is not a variadic macro, and too many args were specified, emit
670 // an error.
671 if (!isVariadic && NumActuals > MinArgsExpected &&
672 !ContainsCodeCompletionTok) {
673 // Emit the diagnostic at the macro name in case there is a missing ).
674 // Emitting it at the , could be far away from the macro name.
675 Diag(TooManyArgsLoc, diag::err_too_many_args_in_macro_invoc);
676 Diag(MI->getDefinitionLoc(), diag::note_macro_here)
677 << MacroName.getIdentifierInfo();
678
679 // Commas from braced initializer lists will be treated as argument
680 // separators inside macros. Attempt to correct for this with parentheses.
681 // TODO: See if this can be generalized to angle brackets for templates
682 // inside macro arguments.
683
684 SmallVector<Token, 4> FixedArgTokens;
685 unsigned FixedNumArgs = 0;
686 SmallVector<SourceRange, 4> ParenHints, InitLists;
687 if (!GenerateNewArgTokens(*this, ArgTokens, FixedArgTokens, FixedNumArgs,
688 ParenHints, InitLists)) {
689 if (!InitLists.empty()) {
690 DiagnosticBuilder DB =
691 Diag(MacroName,
692 diag::note_init_list_at_beginning_of_macro_argument);
693 for (SmallVector<SourceRange, 4>::iterator
694 Range = InitLists.begin(), RangeEnd = InitLists.end();
695 Range != RangeEnd; ++Range) {
696 if (DB.hasMaxRanges())
697 break;
698 DB << *Range;
699 }
700 }
701 return 0;
702 }
703 if (FixedNumArgs != MinArgsExpected)
704 return 0;
705
706 DiagnosticBuilder DB = Diag(MacroName, diag::note_suggest_parens_for_macro);
707 for (SmallVector<SourceRange, 4>::iterator
708 ParenLocation = ParenHints.begin(), ParenEnd = ParenHints.end();
709 ParenLocation != ParenEnd; ++ParenLocation) {
710 if (DB.hasMaxFixItHints())
711 break;
712 DB << FixItHint::CreateInsertion(ParenLocation->getBegin(), "(");
713 if (DB.hasMaxFixItHints())
714 break;
715 DB << FixItHint::CreateInsertion(ParenLocation->getEnd(), ")");
716 }
717 ArgTokens.swap(FixedArgTokens);
718 NumActuals = FixedNumArgs;
719 }
720
721 // See MacroArgs instance var for description of this.
722 bool isVarargsElided = false;
723
724 if (ContainsCodeCompletionTok) {
725 // Recover from not-fully-formed macro invocation during code-completion.
726 Token EOFTok;
727 EOFTok.startToken();
728 EOFTok.setKind(tok::eof);
729 EOFTok.setLocation(Tok.getLocation());
730 EOFTok.setLength(0);
731 for (; NumActuals < MinArgsExpected; ++NumActuals)
732 ArgTokens.push_back(EOFTok);
733 }
734
735 if (NumActuals < MinArgsExpected) {
736 // There are several cases where too few arguments is ok, handle them now.
737 if (NumActuals == 0 && MinArgsExpected == 1) {
738 // #define A(X) or #define A(...) ---> A()
739
740 // If there is exactly one argument, and that argument is missing,
741 // then we have an empty "()" argument empty list. This is fine, even if
742 // the macro expects one argument (the argument is just empty).
743 isVarargsElided = MI->isVariadic();
744 } else if (MI->isVariadic() &&
745 (NumActuals+1 == MinArgsExpected || // A(x, ...) -> A(X)
746 (NumActuals == 0 && MinArgsExpected == 2))) {// A(x,...) -> A()
747 // Varargs where the named vararg parameter is missing: OK as extension.
748 // #define A(x, ...)
749 // A("blah")
750 //
751 // If the macro contains the comma pasting extension, the diagnostic
752 // is suppressed; we know we'll get another diagnostic later.
753 if (!MI->hasCommaPasting()) {
754 Diag(Tok, diag::ext_missing_varargs_arg);
755 Diag(MI->getDefinitionLoc(), diag::note_macro_here)
756 << MacroName.getIdentifierInfo();
757 }
758
759 // Remember this occurred, allowing us to elide the comma when used for
760 // cases like:
761 // #define A(x, foo...) blah(a, ## foo)
762 // #define B(x, ...) blah(a, ## __VA_ARGS__)
763 // #define C(...) blah(a, ## __VA_ARGS__)
764 // A(x) B(x) C()
765 isVarargsElided = true;
766 } else if (!ContainsCodeCompletionTok) {
767 // Otherwise, emit the error.
768 Diag(Tok, diag::err_too_few_args_in_macro_invoc);
769 Diag(MI->getDefinitionLoc(), diag::note_macro_here)
770 << MacroName.getIdentifierInfo();
771 return 0;
772 }
773
774 // Add a marker EOF token to the end of the token list for this argument.
775 SourceLocation EndLoc = Tok.getLocation();
776 Tok.startToken();
777 Tok.setKind(tok::eof);
778 Tok.setLocation(EndLoc);
779 Tok.setLength(0);
780 ArgTokens.push_back(Tok);
781
782 // If we expect two arguments, add both as empty.
783 if (NumActuals == 0 && MinArgsExpected == 2)
784 ArgTokens.push_back(Tok);
785
786 } else if (NumActuals > MinArgsExpected && !MI->isVariadic() &&
787 !ContainsCodeCompletionTok) {
788 // Emit the diagnostic at the macro name in case there is a missing ).
789 // Emitting it at the , could be far away from the macro name.
790 Diag(MacroName, diag::err_too_many_args_in_macro_invoc);
791 Diag(MI->getDefinitionLoc(), diag::note_macro_here)
792 << MacroName.getIdentifierInfo();
793 return 0;
794 }
795
796 return MacroArgs::create(MI, ArgTokens, isVarargsElided, *this);
797 }
798
799 /// \brief Keeps macro expanded tokens for TokenLexers.
800 //
801 /// Works like a stack; a TokenLexer adds the macro expanded tokens that is
802 /// going to lex in the cache and when it finishes the tokens are removed
803 /// from the end of the cache.
cacheMacroExpandedTokens(TokenLexer * tokLexer,ArrayRef<Token> tokens)804 Token *Preprocessor::cacheMacroExpandedTokens(TokenLexer *tokLexer,
805 ArrayRef<Token> tokens) {
806 assert(tokLexer);
807 if (tokens.empty())
808 return 0;
809
810 size_t newIndex = MacroExpandedTokens.size();
811 bool cacheNeedsToGrow = tokens.size() >
812 MacroExpandedTokens.capacity()-MacroExpandedTokens.size();
813 MacroExpandedTokens.append(tokens.begin(), tokens.end());
814
815 if (cacheNeedsToGrow) {
816 // Go through all the TokenLexers whose 'Tokens' pointer points in the
817 // buffer and update the pointers to the (potential) new buffer array.
818 for (unsigned i = 0, e = MacroExpandingLexersStack.size(); i != e; ++i) {
819 TokenLexer *prevLexer;
820 size_t tokIndex;
821 llvm::tie(prevLexer, tokIndex) = MacroExpandingLexersStack[i];
822 prevLexer->Tokens = MacroExpandedTokens.data() + tokIndex;
823 }
824 }
825
826 MacroExpandingLexersStack.push_back(std::make_pair(tokLexer, newIndex));
827 return MacroExpandedTokens.data() + newIndex;
828 }
829
removeCachedMacroExpandedTokensOfLastLexer()830 void Preprocessor::removeCachedMacroExpandedTokensOfLastLexer() {
831 assert(!MacroExpandingLexersStack.empty());
832 size_t tokIndex = MacroExpandingLexersStack.back().second;
833 assert(tokIndex < MacroExpandedTokens.size());
834 // Pop the cached macro expanded tokens from the end.
835 MacroExpandedTokens.resize(tokIndex);
836 MacroExpandingLexersStack.pop_back();
837 }
838
839 /// ComputeDATE_TIME - Compute the current time, enter it into the specified
840 /// scratch buffer, then return DATELoc/TIMELoc locations with the position of
841 /// the identifier tokens inserted.
ComputeDATE_TIME(SourceLocation & DATELoc,SourceLocation & TIMELoc,Preprocessor & PP)842 static void ComputeDATE_TIME(SourceLocation &DATELoc, SourceLocation &TIMELoc,
843 Preprocessor &PP) {
844 time_t TT = time(0);
845 struct tm *TM = localtime(&TT);
846
847 static const char * const Months[] = {
848 "Jan","Feb","Mar","Apr","May","Jun","Jul","Aug","Sep","Oct","Nov","Dec"
849 };
850
851 {
852 SmallString<32> TmpBuffer;
853 llvm::raw_svector_ostream TmpStream(TmpBuffer);
854 TmpStream << llvm::format("\"%s %2d %4d\"", Months[TM->tm_mon],
855 TM->tm_mday, TM->tm_year + 1900);
856 Token TmpTok;
857 TmpTok.startToken();
858 PP.CreateString(TmpStream.str(), TmpTok);
859 DATELoc = TmpTok.getLocation();
860 }
861
862 {
863 SmallString<32> TmpBuffer;
864 llvm::raw_svector_ostream TmpStream(TmpBuffer);
865 TmpStream << llvm::format("\"%02d:%02d:%02d\"",
866 TM->tm_hour, TM->tm_min, TM->tm_sec);
867 Token TmpTok;
868 TmpTok.startToken();
869 PP.CreateString(TmpStream.str(), TmpTok);
870 TIMELoc = TmpTok.getLocation();
871 }
872 }
873
874
875 /// HasFeature - Return true if we recognize and implement the feature
876 /// specified by the identifier as a standard language feature.
HasFeature(const Preprocessor & PP,const IdentifierInfo * II)877 static bool HasFeature(const Preprocessor &PP, const IdentifierInfo *II) {
878 const LangOptions &LangOpts = PP.getLangOpts();
879 StringRef Feature = II->getName();
880
881 // Normalize the feature name, __foo__ becomes foo.
882 if (Feature.startswith("__") && Feature.endswith("__") && Feature.size() >= 4)
883 Feature = Feature.substr(2, Feature.size() - 4);
884
885 return llvm::StringSwitch<bool>(Feature)
886 .Case("address_sanitizer", LangOpts.Sanitize.Address)
887 .Case("attribute_analyzer_noreturn", true)
888 .Case("attribute_availability", true)
889 .Case("attribute_availability_with_message", true)
890 .Case("attribute_cf_returns_not_retained", true)
891 .Case("attribute_cf_returns_retained", true)
892 .Case("attribute_deprecated_with_message", true)
893 .Case("attribute_ext_vector_type", true)
894 .Case("attribute_ns_returns_not_retained", true)
895 .Case("attribute_ns_returns_retained", true)
896 .Case("attribute_ns_consumes_self", true)
897 .Case("attribute_ns_consumed", true)
898 .Case("attribute_cf_consumed", true)
899 .Case("attribute_objc_ivar_unused", true)
900 .Case("attribute_objc_method_family", true)
901 .Case("attribute_overloadable", true)
902 .Case("attribute_unavailable_with_message", true)
903 .Case("attribute_unused_on_fields", true)
904 .Case("blocks", LangOpts.Blocks)
905 .Case("c_thread_safety_attributes", true)
906 .Case("cxx_exceptions", LangOpts.Exceptions)
907 .Case("cxx_rtti", LangOpts.RTTI)
908 .Case("enumerator_attributes", true)
909 .Case("memory_sanitizer", LangOpts.Sanitize.Memory)
910 .Case("thread_sanitizer", LangOpts.Sanitize.Thread)
911 // Objective-C features
912 .Case("objc_arr", LangOpts.ObjCAutoRefCount) // FIXME: REMOVE?
913 .Case("objc_arc", LangOpts.ObjCAutoRefCount)
914 .Case("objc_arc_weak", LangOpts.ObjCARCWeak)
915 .Case("objc_default_synthesize_properties", LangOpts.ObjC2)
916 .Case("objc_fixed_enum", LangOpts.ObjC2)
917 .Case("objc_instancetype", LangOpts.ObjC2)
918 .Case("objc_modules", LangOpts.ObjC2 && LangOpts.Modules)
919 .Case("objc_nonfragile_abi", LangOpts.ObjCRuntime.isNonFragile())
920 .Case("objc_property_explicit_atomic", true) // Does clang support explicit "atomic" keyword?
921 .Case("objc_weak_class", LangOpts.ObjCRuntime.hasWeakClassImport())
922 .Case("objc_msg_lookup_stret", LangOpts.ObjCRuntime.getKind() == ObjCRuntime::ObjFW)
923 .Case("ownership_holds", true)
924 .Case("ownership_returns", true)
925 .Case("ownership_takes", true)
926 .Case("objc_bool", true)
927 .Case("objc_subscripting", LangOpts.ObjCRuntime.isNonFragile())
928 .Case("objc_array_literals", LangOpts.ObjC2)
929 .Case("objc_dictionary_literals", LangOpts.ObjC2)
930 .Case("objc_boxed_expressions", LangOpts.ObjC2)
931 .Case("arc_cf_code_audited", true)
932 // C11 features
933 .Case("c_alignas", LangOpts.C11)
934 .Case("c_atomic", LangOpts.C11)
935 .Case("c_generic_selections", LangOpts.C11)
936 .Case("c_static_assert", LangOpts.C11)
937 .Case("c_thread_local",
938 LangOpts.C11 && PP.getTargetInfo().isTLSSupported())
939 // C++11 features
940 .Case("cxx_access_control_sfinae", LangOpts.CPlusPlus11)
941 .Case("cxx_alias_templates", LangOpts.CPlusPlus11)
942 .Case("cxx_alignas", LangOpts.CPlusPlus11)
943 .Case("cxx_atomic", LangOpts.CPlusPlus11)
944 .Case("cxx_attributes", LangOpts.CPlusPlus11)
945 .Case("cxx_auto_type", LangOpts.CPlusPlus11)
946 .Case("cxx_constexpr", LangOpts.CPlusPlus11)
947 .Case("cxx_decltype", LangOpts.CPlusPlus11)
948 .Case("cxx_decltype_incomplete_return_types", LangOpts.CPlusPlus11)
949 .Case("cxx_default_function_template_args", LangOpts.CPlusPlus11)
950 .Case("cxx_defaulted_functions", LangOpts.CPlusPlus11)
951 .Case("cxx_delegating_constructors", LangOpts.CPlusPlus11)
952 .Case("cxx_deleted_functions", LangOpts.CPlusPlus11)
953 .Case("cxx_explicit_conversions", LangOpts.CPlusPlus11)
954 .Case("cxx_generalized_initializers", LangOpts.CPlusPlus11)
955 .Case("cxx_implicit_moves", LangOpts.CPlusPlus11)
956 .Case("cxx_inheriting_constructors", LangOpts.CPlusPlus11)
957 .Case("cxx_inline_namespaces", LangOpts.CPlusPlus11)
958 .Case("cxx_lambdas", LangOpts.CPlusPlus11)
959 .Case("cxx_local_type_template_args", LangOpts.CPlusPlus11)
960 .Case("cxx_nonstatic_member_init", LangOpts.CPlusPlus11)
961 .Case("cxx_noexcept", LangOpts.CPlusPlus11)
962 .Case("cxx_nullptr", LangOpts.CPlusPlus11)
963 .Case("cxx_override_control", LangOpts.CPlusPlus11)
964 .Case("cxx_range_for", LangOpts.CPlusPlus11)
965 .Case("cxx_raw_string_literals", LangOpts.CPlusPlus11)
966 .Case("cxx_reference_qualified_functions", LangOpts.CPlusPlus11)
967 .Case("cxx_rvalue_references", LangOpts.CPlusPlus11)
968 .Case("cxx_strong_enums", LangOpts.CPlusPlus11)
969 .Case("cxx_static_assert", LangOpts.CPlusPlus11)
970 .Case("cxx_thread_local",
971 LangOpts.CPlusPlus11 && PP.getTargetInfo().isTLSSupported())
972 .Case("cxx_trailing_return", LangOpts.CPlusPlus11)
973 .Case("cxx_unicode_literals", LangOpts.CPlusPlus11)
974 .Case("cxx_unrestricted_unions", LangOpts.CPlusPlus11)
975 .Case("cxx_user_literals", LangOpts.CPlusPlus11)
976 .Case("cxx_variadic_templates", LangOpts.CPlusPlus11)
977 // C++1y features
978 .Case("cxx_aggregate_nsdmi", LangOpts.CPlusPlus1y)
979 .Case("cxx_binary_literals", LangOpts.CPlusPlus1y)
980 .Case("cxx_contextual_conversions", LangOpts.CPlusPlus1y)
981 //.Case("cxx_generic_lambda", LangOpts.CPlusPlus1y)
982 //.Case("cxx_init_capture", LangOpts.CPlusPlus1y)
983 .Case("cxx_relaxed_constexpr", LangOpts.CPlusPlus1y)
984 .Case("cxx_return_type_deduction", LangOpts.CPlusPlus1y)
985 //.Case("cxx_runtime_array", LangOpts.CPlusPlus1y)
986 //.Case("cxx_variable_templates", LangOpts.CPlusPlus1y)
987 // Type traits
988 .Case("has_nothrow_assign", LangOpts.CPlusPlus)
989 .Case("has_nothrow_copy", LangOpts.CPlusPlus)
990 .Case("has_nothrow_constructor", LangOpts.CPlusPlus)
991 .Case("has_trivial_assign", LangOpts.CPlusPlus)
992 .Case("has_trivial_copy", LangOpts.CPlusPlus)
993 .Case("has_trivial_constructor", LangOpts.CPlusPlus)
994 .Case("has_trivial_destructor", LangOpts.CPlusPlus)
995 .Case("has_virtual_destructor", LangOpts.CPlusPlus)
996 .Case("is_abstract", LangOpts.CPlusPlus)
997 .Case("is_base_of", LangOpts.CPlusPlus)
998 .Case("is_class", LangOpts.CPlusPlus)
999 .Case("is_convertible_to", LangOpts.CPlusPlus)
1000 .Case("is_empty", LangOpts.CPlusPlus)
1001 .Case("is_enum", LangOpts.CPlusPlus)
1002 .Case("is_final", LangOpts.CPlusPlus)
1003 .Case("is_literal", LangOpts.CPlusPlus)
1004 .Case("is_standard_layout", LangOpts.CPlusPlus)
1005 .Case("is_pod", LangOpts.CPlusPlus)
1006 .Case("is_polymorphic", LangOpts.CPlusPlus)
1007 .Case("is_trivial", LangOpts.CPlusPlus)
1008 .Case("is_trivially_assignable", LangOpts.CPlusPlus)
1009 .Case("is_trivially_constructible", LangOpts.CPlusPlus)
1010 .Case("is_trivially_copyable", LangOpts.CPlusPlus)
1011 .Case("is_union", LangOpts.CPlusPlus)
1012 .Case("modules", LangOpts.Modules)
1013 .Case("tls", PP.getTargetInfo().isTLSSupported())
1014 .Case("underlying_type", LangOpts.CPlusPlus)
1015 .Default(false);
1016 }
1017
1018 /// HasExtension - Return true if we recognize and implement the feature
1019 /// specified by the identifier, either as an extension or a standard language
1020 /// feature.
HasExtension(const Preprocessor & PP,const IdentifierInfo * II)1021 static bool HasExtension(const Preprocessor &PP, const IdentifierInfo *II) {
1022 if (HasFeature(PP, II))
1023 return true;
1024
1025 // If the use of an extension results in an error diagnostic, extensions are
1026 // effectively unavailable, so just return false here.
1027 if (PP.getDiagnostics().getExtensionHandlingBehavior() ==
1028 DiagnosticsEngine::Ext_Error)
1029 return false;
1030
1031 const LangOptions &LangOpts = PP.getLangOpts();
1032 StringRef Extension = II->getName();
1033
1034 // Normalize the extension name, __foo__ becomes foo.
1035 if (Extension.startswith("__") && Extension.endswith("__") &&
1036 Extension.size() >= 4)
1037 Extension = Extension.substr(2, Extension.size() - 4);
1038
1039 // Because we inherit the feature list from HasFeature, this string switch
1040 // must be less restrictive than HasFeature's.
1041 return llvm::StringSwitch<bool>(Extension)
1042 // C11 features supported by other languages as extensions.
1043 .Case("c_alignas", true)
1044 .Case("c_atomic", true)
1045 .Case("c_generic_selections", true)
1046 .Case("c_static_assert", true)
1047 // C++11 features supported by other languages as extensions.
1048 .Case("cxx_atomic", LangOpts.CPlusPlus)
1049 .Case("cxx_deleted_functions", LangOpts.CPlusPlus)
1050 .Case("cxx_explicit_conversions", LangOpts.CPlusPlus)
1051 .Case("cxx_inline_namespaces", LangOpts.CPlusPlus)
1052 .Case("cxx_local_type_template_args", LangOpts.CPlusPlus)
1053 .Case("cxx_nonstatic_member_init", LangOpts.CPlusPlus)
1054 .Case("cxx_override_control", LangOpts.CPlusPlus)
1055 .Case("cxx_range_for", LangOpts.CPlusPlus)
1056 .Case("cxx_reference_qualified_functions", LangOpts.CPlusPlus)
1057 .Case("cxx_rvalue_references", LangOpts.CPlusPlus)
1058 // C++1y features supported by other languages as extensions.
1059 .Case("cxx_binary_literals", true)
1060 .Default(false);
1061 }
1062
1063 /// HasAttribute - Return true if we recognize and implement the attribute
1064 /// specified by the given identifier.
HasAttribute(const IdentifierInfo * II)1065 static bool HasAttribute(const IdentifierInfo *II) {
1066 StringRef Name = II->getName();
1067 // Normalize the attribute name, __foo__ becomes foo.
1068 if (Name.startswith("__") && Name.endswith("__") && Name.size() >= 4)
1069 Name = Name.substr(2, Name.size() - 4);
1070
1071 // FIXME: Do we need to handle namespaces here?
1072 return llvm::StringSwitch<bool>(Name)
1073 #include "clang/Lex/AttrSpellings.inc"
1074 .Default(false);
1075 }
1076
1077 /// EvaluateHasIncludeCommon - Process a '__has_include("path")'
1078 /// or '__has_include_next("path")' expression.
1079 /// Returns true if successful.
EvaluateHasIncludeCommon(Token & Tok,IdentifierInfo * II,Preprocessor & PP,const DirectoryLookup * LookupFrom)1080 static bool EvaluateHasIncludeCommon(Token &Tok,
1081 IdentifierInfo *II, Preprocessor &PP,
1082 const DirectoryLookup *LookupFrom) {
1083 // Save the location of the current token. If a '(' is later found, use
1084 // that location. If not, use the end of this location instead.
1085 SourceLocation LParenLoc = Tok.getLocation();
1086
1087 // These expressions are only allowed within a preprocessor directive.
1088 if (!PP.isParsingIfOrElifDirective()) {
1089 PP.Diag(LParenLoc, diag::err_pp_directive_required) << II->getName();
1090 return false;
1091 }
1092
1093 // Get '('.
1094 PP.LexNonComment(Tok);
1095
1096 // Ensure we have a '('.
1097 if (Tok.isNot(tok::l_paren)) {
1098 // No '(', use end of last token.
1099 LParenLoc = PP.getLocForEndOfToken(LParenLoc);
1100 PP.Diag(LParenLoc, diag::err_pp_missing_lparen) << II->getName();
1101 // If the next token looks like a filename or the start of one,
1102 // assume it is and process it as such.
1103 if (!Tok.is(tok::angle_string_literal) && !Tok.is(tok::string_literal) &&
1104 !Tok.is(tok::less))
1105 return false;
1106 } else {
1107 // Save '(' location for possible missing ')' message.
1108 LParenLoc = Tok.getLocation();
1109
1110 if (PP.getCurrentLexer()) {
1111 // Get the file name.
1112 PP.getCurrentLexer()->LexIncludeFilename(Tok);
1113 } else {
1114 // We're in a macro, so we can't use LexIncludeFilename; just
1115 // grab the next token.
1116 PP.Lex(Tok);
1117 }
1118 }
1119
1120 // Reserve a buffer to get the spelling.
1121 SmallString<128> FilenameBuffer;
1122 StringRef Filename;
1123 SourceLocation EndLoc;
1124
1125 switch (Tok.getKind()) {
1126 case tok::eod:
1127 // If the token kind is EOD, the error has already been diagnosed.
1128 return false;
1129
1130 case tok::angle_string_literal:
1131 case tok::string_literal: {
1132 bool Invalid = false;
1133 Filename = PP.getSpelling(Tok, FilenameBuffer, &Invalid);
1134 if (Invalid)
1135 return false;
1136 break;
1137 }
1138
1139 case tok::less:
1140 // This could be a <foo/bar.h> file coming from a macro expansion. In this
1141 // case, glue the tokens together into FilenameBuffer and interpret those.
1142 FilenameBuffer.push_back('<');
1143 if (PP.ConcatenateIncludeName(FilenameBuffer, EndLoc)) {
1144 // Let the caller know a <eod> was found by changing the Token kind.
1145 Tok.setKind(tok::eod);
1146 return false; // Found <eod> but no ">"? Diagnostic already emitted.
1147 }
1148 Filename = FilenameBuffer.str();
1149 break;
1150 default:
1151 PP.Diag(Tok.getLocation(), diag::err_pp_expects_filename);
1152 return false;
1153 }
1154
1155 SourceLocation FilenameLoc = Tok.getLocation();
1156
1157 // Get ')'.
1158 PP.LexNonComment(Tok);
1159
1160 // Ensure we have a trailing ).
1161 if (Tok.isNot(tok::r_paren)) {
1162 PP.Diag(PP.getLocForEndOfToken(FilenameLoc), diag::err_pp_missing_rparen)
1163 << II->getName();
1164 PP.Diag(LParenLoc, diag::note_matching) << "(";
1165 return false;
1166 }
1167
1168 bool isAngled = PP.GetIncludeFilenameSpelling(Tok.getLocation(), Filename);
1169 // If GetIncludeFilenameSpelling set the start ptr to null, there was an
1170 // error.
1171 if (Filename.empty())
1172 return false;
1173
1174 // Search include directories.
1175 const DirectoryLookup *CurDir;
1176 const FileEntry *File =
1177 PP.LookupFile(FilenameLoc, Filename, isAngled, LookupFrom, CurDir, NULL,
1178 NULL, NULL);
1179
1180 // Get the result value. A result of true means the file exists.
1181 return File != 0;
1182 }
1183
1184 /// EvaluateHasInclude - Process a '__has_include("path")' expression.
1185 /// Returns true if successful.
EvaluateHasInclude(Token & Tok,IdentifierInfo * II,Preprocessor & PP)1186 static bool EvaluateHasInclude(Token &Tok, IdentifierInfo *II,
1187 Preprocessor &PP) {
1188 return EvaluateHasIncludeCommon(Tok, II, PP, NULL);
1189 }
1190
1191 /// EvaluateHasIncludeNext - Process '__has_include_next("path")' expression.
1192 /// Returns true if successful.
EvaluateHasIncludeNext(Token & Tok,IdentifierInfo * II,Preprocessor & PP)1193 static bool EvaluateHasIncludeNext(Token &Tok,
1194 IdentifierInfo *II, Preprocessor &PP) {
1195 // __has_include_next is like __has_include, except that we start
1196 // searching after the current found directory. If we can't do this,
1197 // issue a diagnostic.
1198 const DirectoryLookup *Lookup = PP.GetCurDirLookup();
1199 if (PP.isInPrimaryFile()) {
1200 Lookup = 0;
1201 PP.Diag(Tok, diag::pp_include_next_in_primary);
1202 } else if (Lookup == 0) {
1203 PP.Diag(Tok, diag::pp_include_next_absolute_path);
1204 } else {
1205 // Start looking up in the next directory.
1206 ++Lookup;
1207 }
1208
1209 return EvaluateHasIncludeCommon(Tok, II, PP, Lookup);
1210 }
1211
1212 /// \brief Process __building_module(identifier) expression.
1213 /// \returns true if we are building the named module, false otherwise.
EvaluateBuildingModule(Token & Tok,IdentifierInfo * II,Preprocessor & PP)1214 static bool EvaluateBuildingModule(Token &Tok,
1215 IdentifierInfo *II, Preprocessor &PP) {
1216 // Get '('.
1217 PP.LexNonComment(Tok);
1218
1219 // Ensure we have a '('.
1220 if (Tok.isNot(tok::l_paren)) {
1221 PP.Diag(Tok.getLocation(), diag::err_pp_missing_lparen) << II->getName();
1222 return false;
1223 }
1224
1225 // Save '(' location for possible missing ')' message.
1226 SourceLocation LParenLoc = Tok.getLocation();
1227
1228 // Get the module name.
1229 PP.LexNonComment(Tok);
1230
1231 // Ensure that we have an identifier.
1232 if (Tok.isNot(tok::identifier)) {
1233 PP.Diag(Tok.getLocation(), diag::err_expected_id_building_module);
1234 return false;
1235 }
1236
1237 bool Result
1238 = Tok.getIdentifierInfo()->getName() == PP.getLangOpts().CurrentModule;
1239
1240 // Get ')'.
1241 PP.LexNonComment(Tok);
1242
1243 // Ensure we have a trailing ).
1244 if (Tok.isNot(tok::r_paren)) {
1245 PP.Diag(Tok.getLocation(), diag::err_pp_missing_rparen) << II->getName();
1246 PP.Diag(LParenLoc, diag::note_matching) << "(";
1247 return false;
1248 }
1249
1250 return Result;
1251 }
1252
1253 /// ExpandBuiltinMacro - If an identifier token is read that is to be expanded
1254 /// as a builtin macro, handle it and return the next token as 'Tok'.
ExpandBuiltinMacro(Token & Tok)1255 void Preprocessor::ExpandBuiltinMacro(Token &Tok) {
1256 // Figure out which token this is.
1257 IdentifierInfo *II = Tok.getIdentifierInfo();
1258 assert(II && "Can't be a macro without id info!");
1259
1260 // If this is an _Pragma or Microsoft __pragma directive, expand it,
1261 // invoke the pragma handler, then lex the token after it.
1262 if (II == Ident_Pragma)
1263 return Handle_Pragma(Tok);
1264 else if (II == Ident__pragma) // in non-MS mode this is null
1265 return HandleMicrosoft__pragma(Tok);
1266
1267 ++NumBuiltinMacroExpanded;
1268
1269 SmallString<128> TmpBuffer;
1270 llvm::raw_svector_ostream OS(TmpBuffer);
1271
1272 // Set up the return result.
1273 Tok.setIdentifierInfo(0);
1274 Tok.clearFlag(Token::NeedsCleaning);
1275
1276 if (II == Ident__LINE__) {
1277 // C99 6.10.8: "__LINE__: The presumed line number (within the current
1278 // source file) of the current source line (an integer constant)". This can
1279 // be affected by #line.
1280 SourceLocation Loc = Tok.getLocation();
1281
1282 // Advance to the location of the first _, this might not be the first byte
1283 // of the token if it starts with an escaped newline.
1284 Loc = AdvanceToTokenCharacter(Loc, 0);
1285
1286 // One wrinkle here is that GCC expands __LINE__ to location of the *end* of
1287 // a macro expansion. This doesn't matter for object-like macros, but
1288 // can matter for a function-like macro that expands to contain __LINE__.
1289 // Skip down through expansion points until we find a file loc for the
1290 // end of the expansion history.
1291 Loc = SourceMgr.getExpansionRange(Loc).second;
1292 PresumedLoc PLoc = SourceMgr.getPresumedLoc(Loc);
1293
1294 // __LINE__ expands to a simple numeric value.
1295 OS << (PLoc.isValid()? PLoc.getLine() : 1);
1296 Tok.setKind(tok::numeric_constant);
1297 } else if (II == Ident__FILE__ || II == Ident__BASE_FILE__) {
1298 // C99 6.10.8: "__FILE__: The presumed name of the current source file (a
1299 // character string literal)". This can be affected by #line.
1300 PresumedLoc PLoc = SourceMgr.getPresumedLoc(Tok.getLocation());
1301
1302 // __BASE_FILE__ is a GNU extension that returns the top of the presumed
1303 // #include stack instead of the current file.
1304 if (II == Ident__BASE_FILE__ && PLoc.isValid()) {
1305 SourceLocation NextLoc = PLoc.getIncludeLoc();
1306 while (NextLoc.isValid()) {
1307 PLoc = SourceMgr.getPresumedLoc(NextLoc);
1308 if (PLoc.isInvalid())
1309 break;
1310
1311 NextLoc = PLoc.getIncludeLoc();
1312 }
1313 }
1314
1315 // Escape this filename. Turn '\' -> '\\' '"' -> '\"'
1316 SmallString<128> FN;
1317 if (PLoc.isValid()) {
1318 FN += PLoc.getFilename();
1319 Lexer::Stringify(FN);
1320 OS << '"' << FN.str() << '"';
1321 }
1322 Tok.setKind(tok::string_literal);
1323 } else if (II == Ident__DATE__) {
1324 if (!DATELoc.isValid())
1325 ComputeDATE_TIME(DATELoc, TIMELoc, *this);
1326 Tok.setKind(tok::string_literal);
1327 Tok.setLength(strlen("\"Mmm dd yyyy\""));
1328 Tok.setLocation(SourceMgr.createExpansionLoc(DATELoc, Tok.getLocation(),
1329 Tok.getLocation(),
1330 Tok.getLength()));
1331 return;
1332 } else if (II == Ident__TIME__) {
1333 if (!TIMELoc.isValid())
1334 ComputeDATE_TIME(DATELoc, TIMELoc, *this);
1335 Tok.setKind(tok::string_literal);
1336 Tok.setLength(strlen("\"hh:mm:ss\""));
1337 Tok.setLocation(SourceMgr.createExpansionLoc(TIMELoc, Tok.getLocation(),
1338 Tok.getLocation(),
1339 Tok.getLength()));
1340 return;
1341 } else if (II == Ident__INCLUDE_LEVEL__) {
1342 // Compute the presumed include depth of this token. This can be affected
1343 // by GNU line markers.
1344 unsigned Depth = 0;
1345
1346 PresumedLoc PLoc = SourceMgr.getPresumedLoc(Tok.getLocation());
1347 if (PLoc.isValid()) {
1348 PLoc = SourceMgr.getPresumedLoc(PLoc.getIncludeLoc());
1349 for (; PLoc.isValid(); ++Depth)
1350 PLoc = SourceMgr.getPresumedLoc(PLoc.getIncludeLoc());
1351 }
1352
1353 // __INCLUDE_LEVEL__ expands to a simple numeric value.
1354 OS << Depth;
1355 Tok.setKind(tok::numeric_constant);
1356 } else if (II == Ident__TIMESTAMP__) {
1357 // MSVC, ICC, GCC, VisualAge C++ extension. The generated string should be
1358 // of the form "Ddd Mmm dd hh::mm::ss yyyy", which is returned by asctime.
1359
1360 // Get the file that we are lexing out of. If we're currently lexing from
1361 // a macro, dig into the include stack.
1362 const FileEntry *CurFile = 0;
1363 PreprocessorLexer *TheLexer = getCurrentFileLexer();
1364
1365 if (TheLexer)
1366 CurFile = SourceMgr.getFileEntryForID(TheLexer->getFileID());
1367
1368 const char *Result;
1369 if (CurFile) {
1370 time_t TT = CurFile->getModificationTime();
1371 struct tm *TM = localtime(&TT);
1372 Result = asctime(TM);
1373 } else {
1374 Result = "??? ??? ?? ??:??:?? ????\n";
1375 }
1376 // Surround the string with " and strip the trailing newline.
1377 OS << '"' << StringRef(Result, strlen(Result)-1) << '"';
1378 Tok.setKind(tok::string_literal);
1379 } else if (II == Ident__COUNTER__) {
1380 // __COUNTER__ expands to a simple numeric value.
1381 OS << CounterValue++;
1382 Tok.setKind(tok::numeric_constant);
1383 } else if (II == Ident__has_feature ||
1384 II == Ident__has_extension ||
1385 II == Ident__has_builtin ||
1386 II == Ident__has_attribute) {
1387 // The argument to these builtins should be a parenthesized identifier.
1388 SourceLocation StartLoc = Tok.getLocation();
1389
1390 bool IsValid = false;
1391 IdentifierInfo *FeatureII = 0;
1392
1393 // Read the '('.
1394 LexUnexpandedToken(Tok);
1395 if (Tok.is(tok::l_paren)) {
1396 // Read the identifier
1397 LexUnexpandedToken(Tok);
1398 if ((FeatureII = Tok.getIdentifierInfo())) {
1399 // Read the ')'.
1400 LexUnexpandedToken(Tok);
1401 if (Tok.is(tok::r_paren))
1402 IsValid = true;
1403 }
1404 }
1405
1406 bool Value = false;
1407 if (!IsValid)
1408 Diag(StartLoc, diag::err_feature_check_malformed);
1409 else if (II == Ident__has_builtin) {
1410 // Check for a builtin is trivial.
1411 Value = FeatureII->getBuiltinID() != 0;
1412 } else if (II == Ident__has_attribute)
1413 Value = HasAttribute(FeatureII);
1414 else if (II == Ident__has_extension)
1415 Value = HasExtension(*this, FeatureII);
1416 else {
1417 assert(II == Ident__has_feature && "Must be feature check");
1418 Value = HasFeature(*this, FeatureII);
1419 }
1420
1421 OS << (int)Value;
1422 if (IsValid)
1423 Tok.setKind(tok::numeric_constant);
1424 } else if (II == Ident__has_include ||
1425 II == Ident__has_include_next) {
1426 // The argument to these two builtins should be a parenthesized
1427 // file name string literal using angle brackets (<>) or
1428 // double-quotes ("").
1429 bool Value;
1430 if (II == Ident__has_include)
1431 Value = EvaluateHasInclude(Tok, II, *this);
1432 else
1433 Value = EvaluateHasIncludeNext(Tok, II, *this);
1434 OS << (int)Value;
1435 if (Tok.is(tok::r_paren))
1436 Tok.setKind(tok::numeric_constant);
1437 } else if (II == Ident__has_warning) {
1438 // The argument should be a parenthesized string literal.
1439 // The argument to these builtins should be a parenthesized identifier.
1440 SourceLocation StartLoc = Tok.getLocation();
1441 bool IsValid = false;
1442 bool Value = false;
1443 // Read the '('.
1444 LexUnexpandedToken(Tok);
1445 do {
1446 if (Tok.isNot(tok::l_paren)) {
1447 Diag(StartLoc, diag::err_warning_check_malformed);
1448 break;
1449 }
1450
1451 LexUnexpandedToken(Tok);
1452 std::string WarningName;
1453 SourceLocation StrStartLoc = Tok.getLocation();
1454 if (!FinishLexStringLiteral(Tok, WarningName, "'__has_warning'",
1455 /*MacroExpansion=*/false)) {
1456 // Eat tokens until ')'.
1457 while (Tok.isNot(tok::r_paren) && Tok.isNot(tok::eod) &&
1458 Tok.isNot(tok::eof))
1459 LexUnexpandedToken(Tok);
1460 break;
1461 }
1462
1463 // Is the end a ')'?
1464 if (!(IsValid = Tok.is(tok::r_paren))) {
1465 Diag(StartLoc, diag::err_warning_check_malformed);
1466 break;
1467 }
1468
1469 if (WarningName.size() < 3 || WarningName[0] != '-' ||
1470 WarningName[1] != 'W') {
1471 Diag(StrStartLoc, diag::warn_has_warning_invalid_option);
1472 break;
1473 }
1474
1475 // Finally, check if the warning flags maps to a diagnostic group.
1476 // We construct a SmallVector here to talk to getDiagnosticIDs().
1477 // Although we don't use the result, this isn't a hot path, and not
1478 // worth special casing.
1479 SmallVector<diag::kind, 10> Diags;
1480 Value = !getDiagnostics().getDiagnosticIDs()->
1481 getDiagnosticsInGroup(WarningName.substr(2), Diags);
1482 } while (false);
1483
1484 OS << (int)Value;
1485 if (IsValid)
1486 Tok.setKind(tok::numeric_constant);
1487 } else if (II == Ident__building_module) {
1488 // The argument to this builtin should be an identifier. The
1489 // builtin evaluates to 1 when that identifier names the module we are
1490 // currently building.
1491 OS << (int)EvaluateBuildingModule(Tok, II, *this);
1492 Tok.setKind(tok::numeric_constant);
1493 } else if (II == Ident__MODULE__) {
1494 // The current module as an identifier.
1495 OS << getLangOpts().CurrentModule;
1496 IdentifierInfo *ModuleII = getIdentifierInfo(getLangOpts().CurrentModule);
1497 Tok.setIdentifierInfo(ModuleII);
1498 Tok.setKind(ModuleII->getTokenID());
1499 } else {
1500 llvm_unreachable("Unknown identifier!");
1501 }
1502 CreateString(OS.str(), Tok, Tok.getLocation(), Tok.getLocation());
1503 }
1504
markMacroAsUsed(MacroInfo * MI)1505 void Preprocessor::markMacroAsUsed(MacroInfo *MI) {
1506 // If the 'used' status changed, and the macro requires 'unused' warning,
1507 // remove its SourceLocation from the warn-for-unused-macro locations.
1508 if (MI->isWarnIfUnused() && !MI->isUsed())
1509 WarnUnusedMacroLocs.erase(MI->getDefinitionLoc());
1510 MI->setIsUsed(true);
1511 }
1512