1 // Copyright 2012 the V8 project authors. All rights reserved. 2 // Use of this source code is governed by a BSD-style license that can be 3 // found in the LICENSE file. 4 5 #ifndef V8_PARSING_TOKEN_H_ 6 #define V8_PARSING_TOKEN_H_ 7 8 #include "src/base/logging.h" 9 #include "src/globals.h" 10 11 namespace v8 { 12 namespace internal { 13 14 // TOKEN_LIST takes a list of 3 macros M, all of which satisfy the 15 // same signature M(name, string, precedence), where name is the 16 // symbolic token name, string is the corresponding syntactic symbol 17 // (or NULL, for literals), and precedence is the precedence (or 0). 18 // The parameters are invoked for token categories as follows: 19 // 20 // T: Non-keyword tokens 21 // K: Keyword tokens 22 23 // IGNORE_TOKEN is a convenience macro that can be supplied as 24 // an argument (at any position) for a TOKEN_LIST call. It does 25 // nothing with tokens belonging to the respective category. 26 27 #define IGNORE_TOKEN(name, string, precedence) 28 29 #define TOKEN_LIST(T, K) \ 30 /* End of source indicator. */ \ 31 T(EOS, "EOS", 0) \ 32 \ 33 /* Punctuators (ECMA-262, section 7.7, page 15). */ \ 34 T(LPAREN, "(", 0) \ 35 T(RPAREN, ")", 0) \ 36 T(LBRACK, "[", 0) \ 37 T(RBRACK, "]", 0) \ 38 T(LBRACE, "{", 0) \ 39 T(RBRACE, "}", 0) \ 40 T(COLON, ":", 0) \ 41 T(SEMICOLON, ";", 0) \ 42 T(PERIOD, ".", 0) \ 43 T(ELLIPSIS, "...", 0) \ 44 T(CONDITIONAL, "?", 3) \ 45 T(INC, "++", 0) \ 46 T(DEC, "--", 0) \ 47 T(ARROW, "=>", 0) \ 48 \ 49 /* Assignment operators. */ \ 50 /* IsAssignmentOp() and Assignment::is_compound() relies on */ \ 51 /* this block of enum values being contiguous and sorted in the */ \ 52 /* same order! */ \ 53 T(INIT, "=init", 2) /* AST-use only. */ \ 54 T(ASSIGN, "=", 2) \ 55 T(ASSIGN_BIT_OR, "|=", 2) \ 56 T(ASSIGN_BIT_XOR, "^=", 2) \ 57 T(ASSIGN_BIT_AND, "&=", 2) \ 58 T(ASSIGN_SHL, "<<=", 2) \ 59 T(ASSIGN_SAR, ">>=", 2) \ 60 T(ASSIGN_SHR, ">>>=", 2) \ 61 T(ASSIGN_ADD, "+=", 2) \ 62 T(ASSIGN_SUB, "-=", 2) \ 63 T(ASSIGN_MUL, "*=", 2) \ 64 T(ASSIGN_DIV, "/=", 2) \ 65 T(ASSIGN_MOD, "%=", 2) \ 66 T(ASSIGN_EXP, "**=", 2) \ 67 \ 68 /* Binary operators sorted by precedence. */ \ 69 /* IsBinaryOp() relies on this block of enum values */ \ 70 /* being contiguous and sorted in the same order! */ \ 71 T(COMMA, ",", 1) \ 72 T(OR, "||", 4) \ 73 T(AND, "&&", 5) \ 74 T(BIT_OR, "|", 6) \ 75 T(BIT_XOR, "^", 7) \ 76 T(BIT_AND, "&", 8) \ 77 T(SHL, "<<", 11) \ 78 T(SAR, ">>", 11) \ 79 T(SHR, ">>>", 11) \ 80 T(ROR, "rotate right", 11) /* only used by Crankshaft */ \ 81 T(ADD, "+", 12) \ 82 T(SUB, "-", 12) \ 83 T(MUL, "*", 13) \ 84 T(DIV, "/", 13) \ 85 T(MOD, "%", 13) \ 86 T(EXP, "**", 14) \ 87 \ 88 /* Compare operators sorted by precedence. */ \ 89 /* IsCompareOp() relies on this block of enum values */ \ 90 /* being contiguous and sorted in the same order! */ \ 91 T(EQ, "==", 9) \ 92 T(NE, "!=", 9) \ 93 T(EQ_STRICT, "===", 9) \ 94 T(NE_STRICT, "!==", 9) \ 95 T(LT, "<", 10) \ 96 T(GT, ">", 10) \ 97 T(LTE, "<=", 10) \ 98 T(GTE, ">=", 10) \ 99 K(INSTANCEOF, "instanceof", 10) \ 100 K(IN, "in", 10) \ 101 \ 102 /* Unary operators. */ \ 103 /* IsUnaryOp() relies on this block of enum values */ \ 104 /* being contiguous and sorted in the same order! */ \ 105 T(NOT, "!", 0) \ 106 T(BIT_NOT, "~", 0) \ 107 K(DELETE, "delete", 0) \ 108 K(TYPEOF, "typeof", 0) \ 109 K(VOID, "void", 0) \ 110 \ 111 /* Keywords (ECMA-262, section 7.5.2, page 13). */ \ 112 K(BREAK, "break", 0) \ 113 K(CASE, "case", 0) \ 114 K(CATCH, "catch", 0) \ 115 K(CONTINUE, "continue", 0) \ 116 K(DEBUGGER, "debugger", 0) \ 117 K(DEFAULT, "default", 0) \ 118 /* DELETE */ \ 119 K(DO, "do", 0) \ 120 K(ELSE, "else", 0) \ 121 K(FINALLY, "finally", 0) \ 122 K(FOR, "for", 0) \ 123 K(FUNCTION, "function", 0) \ 124 K(IF, "if", 0) \ 125 /* IN */ \ 126 /* INSTANCEOF */ \ 127 K(NEW, "new", 0) \ 128 K(RETURN, "return", 0) \ 129 K(SWITCH, "switch", 0) \ 130 K(THIS, "this", 0) \ 131 K(THROW, "throw", 0) \ 132 K(TRY, "try", 0) \ 133 /* TYPEOF */ \ 134 K(VAR, "var", 0) \ 135 /* VOID */ \ 136 K(WHILE, "while", 0) \ 137 K(WITH, "with", 0) \ 138 \ 139 /* Literals (ECMA-262, section 7.8, page 16). */ \ 140 K(NULL_LITERAL, "null", 0) \ 141 K(TRUE_LITERAL, "true", 0) \ 142 K(FALSE_LITERAL, "false", 0) \ 143 T(NUMBER, NULL, 0) \ 144 T(SMI, NULL, 0) \ 145 T(STRING, NULL, 0) \ 146 \ 147 /* Identifiers (not keywords or future reserved words). */ \ 148 T(IDENTIFIER, NULL, 0) \ 149 \ 150 /* Future reserved words (ECMA-262, section 7.6.1.2). */ \ 151 T(FUTURE_STRICT_RESERVED_WORD, NULL, 0) \ 152 K(ASYNC, "async", 0) \ 153 /* `await` is a reserved word in module code only */ \ 154 K(AWAIT, "await", 0) \ 155 K(CLASS, "class", 0) \ 156 K(CONST, "const", 0) \ 157 K(ENUM, "enum", 0) \ 158 K(EXPORT, "export", 0) \ 159 K(EXTENDS, "extends", 0) \ 160 K(IMPORT, "import", 0) \ 161 K(LET, "let", 0) \ 162 K(STATIC, "static", 0) \ 163 K(YIELD, "yield", 0) \ 164 K(SUPER, "super", 0) \ 165 \ 166 /* Illegal token - not able to scan. */ \ 167 T(ILLEGAL, "ILLEGAL", 0) \ 168 T(ESCAPED_KEYWORD, NULL, 0) \ 169 T(ESCAPED_STRICT_RESERVED_WORD, NULL, 0) \ 170 \ 171 /* Scanner-internal use only. */ \ 172 T(WHITESPACE, NULL, 0) \ 173 T(UNINITIALIZED, NULL, 0) \ 174 T(REGEXP_LITERAL, NULL, 0) \ 175 \ 176 /* ES6 Template Literals */ \ 177 T(TEMPLATE_SPAN, NULL, 0) \ 178 T(TEMPLATE_TAIL, NULL, 0) 179 180 class Token { 181 public: 182 // All token values. 183 #define T(name, string, precedence) name, 184 enum Value { 185 TOKEN_LIST(T, T) 186 NUM_TOKENS 187 }; 188 #undef T 189 190 // Returns a string corresponding to the C++ token name 191 // (e.g. "LT" for the token LT). Name(Value tok)192 static const char* Name(Value tok) { 193 DCHECK(tok < NUM_TOKENS); // tok is unsigned 194 return name_[tok]; 195 } 196 197 // Predicates IsKeyword(Value tok)198 static bool IsKeyword(Value tok) { 199 return token_type[tok] == 'K'; 200 } 201 IsIdentifier(Value tok,LanguageMode language_mode,bool is_generator,bool disallow_await)202 static bool IsIdentifier(Value tok, LanguageMode language_mode, 203 bool is_generator, bool disallow_await) { 204 switch (tok) { 205 case IDENTIFIER: 206 case ASYNC: 207 return true; 208 case ESCAPED_STRICT_RESERVED_WORD: 209 case FUTURE_STRICT_RESERVED_WORD: 210 case LET: 211 case STATIC: 212 return is_sloppy(language_mode); 213 case YIELD: 214 return !is_generator && is_sloppy(language_mode); 215 case AWAIT: 216 return !disallow_await; 217 default: 218 return false; 219 } 220 UNREACHABLE(); 221 return false; 222 } 223 IsAssignmentOp(Value tok)224 static bool IsAssignmentOp(Value tok) { 225 return INIT <= tok && tok <= ASSIGN_EXP; 226 } 227 IsBinaryOp(Value op)228 static bool IsBinaryOp(Value op) { return COMMA <= op && op <= EXP; } 229 IsTruncatingBinaryOp(Value op)230 static bool IsTruncatingBinaryOp(Value op) { 231 return BIT_OR <= op && op <= ROR; 232 } 233 IsCompareOp(Value op)234 static bool IsCompareOp(Value op) { 235 return EQ <= op && op <= IN; 236 } 237 IsOrderedRelationalCompareOp(Value op)238 static bool IsOrderedRelationalCompareOp(Value op) { 239 return op == LT || op == LTE || op == GT || op == GTE; 240 } 241 IsEqualityOp(Value op)242 static bool IsEqualityOp(Value op) { 243 return op == EQ || op == EQ_STRICT; 244 } 245 IsInequalityOp(Value op)246 static bool IsInequalityOp(Value op) { 247 return op == NE || op == NE_STRICT; 248 } 249 IsArithmeticCompareOp(Value op)250 static bool IsArithmeticCompareOp(Value op) { 251 return IsOrderedRelationalCompareOp(op) || 252 IsEqualityOp(op) || IsInequalityOp(op); 253 } 254 NegateCompareOp(Value op)255 static Value NegateCompareOp(Value op) { 256 DCHECK(IsArithmeticCompareOp(op)); 257 switch (op) { 258 case EQ: return NE; 259 case NE: return EQ; 260 case EQ_STRICT: return NE_STRICT; 261 case NE_STRICT: return EQ_STRICT; 262 case LT: return GTE; 263 case GT: return LTE; 264 case LTE: return GT; 265 case GTE: return LT; 266 default: 267 UNREACHABLE(); 268 return op; 269 } 270 } 271 ReverseCompareOp(Value op)272 static Value ReverseCompareOp(Value op) { 273 DCHECK(IsArithmeticCompareOp(op)); 274 switch (op) { 275 case EQ: return EQ; 276 case NE: return NE; 277 case EQ_STRICT: return EQ_STRICT; 278 case NE_STRICT: return NE_STRICT; 279 case LT: return GT; 280 case GT: return LT; 281 case LTE: return GTE; 282 case GTE: return LTE; 283 default: 284 UNREACHABLE(); 285 return op; 286 } 287 } 288 EvalComparison(Value op,double op1,double op2)289 static bool EvalComparison(Value op, double op1, double op2) { 290 DCHECK(IsArithmeticCompareOp(op)); 291 switch (op) { 292 case Token::EQ: 293 case Token::EQ_STRICT: return (op1 == op2); 294 case Token::NE: return (op1 != op2); 295 case Token::LT: return (op1 < op2); 296 case Token::GT: return (op1 > op2); 297 case Token::LTE: return (op1 <= op2); 298 case Token::GTE: return (op1 >= op2); 299 default: 300 UNREACHABLE(); 301 return false; 302 } 303 } 304 IsBitOp(Value op)305 static bool IsBitOp(Value op) { 306 return (BIT_OR <= op && op <= SHR) || op == BIT_NOT; 307 } 308 IsUnaryOp(Value op)309 static bool IsUnaryOp(Value op) { 310 return (NOT <= op && op <= VOID) || op == ADD || op == SUB; 311 } 312 IsCountOp(Value op)313 static bool IsCountOp(Value op) { 314 return op == INC || op == DEC; 315 } 316 IsShiftOp(Value op)317 static bool IsShiftOp(Value op) { 318 return (SHL <= op) && (op <= SHR); 319 } 320 321 // Returns a string corresponding to the JS token string 322 // (.e., "<" for the token LT) or NULL if the token doesn't 323 // have a (unique) string (e.g. an IDENTIFIER). String(Value tok)324 static const char* String(Value tok) { 325 DCHECK(tok < NUM_TOKENS); // tok is unsigned. 326 return string_[tok]; 327 } 328 StringLength(Value tok)329 static uint8_t StringLength(Value tok) { 330 DCHECK(tok < NUM_TOKENS); 331 return string_length_[tok]; 332 } 333 334 // Returns the precedence > 0 for binary and compare 335 // operators; returns 0 otherwise. Precedence(Value tok)336 static int Precedence(Value tok) { 337 DCHECK(tok < NUM_TOKENS); // tok is unsigned. 338 return precedence_[tok]; 339 } 340 341 private: 342 static const char* const name_[NUM_TOKENS]; 343 static const char* const string_[NUM_TOKENS]; 344 static const uint8_t string_length_[NUM_TOKENS]; 345 static const int8_t precedence_[NUM_TOKENS]; 346 static const char token_type[NUM_TOKENS]; 347 }; 348 349 } // namespace internal 350 } // namespace v8 351 352 #endif // V8_PARSING_TOKEN_H_ 353