diff options
Diffstat (limited to 'deps/v8/src/char-predicates-inl.h')
-rw-r--r-- | deps/v8/src/char-predicates-inl.h | 97 |
1 files changed, 72 insertions, 25 deletions
diff --git a/deps/v8/src/char-predicates-inl.h b/deps/v8/src/char-predicates-inl.h index 3662514bca..329b3a0fbb 100644 --- a/deps/v8/src/char-predicates-inl.h +++ b/deps/v8/src/char-predicates-inl.h @@ -14,65 +14,112 @@ namespace internal { // If c is in 'A'-'Z' or 'a'-'z', return its lower-case. // Else, return something outside of 'A'-'Z' and 'a'-'z'. // Note: it ignores LOCALE. -inline int AsciiAlphaToLower(uc32 c) { - return c | 0x20; -} +inline constexpr int AsciiAlphaToLower(uc32 c) { return c | 0x20; } -inline bool IsCarriageReturn(uc32 c) { - return c == 0x000D; -} +inline constexpr bool IsCarriageReturn(uc32 c) { return c == 0x000D; } -inline bool IsLineFeed(uc32 c) { - return c == 0x000A; -} +inline constexpr bool IsLineFeed(uc32 c) { return c == 0x000A; } -inline bool IsAsciiIdentifier(uc32 c) { +inline constexpr bool IsAsciiIdentifier(uc32 c) { return IsAlphaNumeric(c) || c == '$' || c == '_'; } -inline bool IsAlphaNumeric(uc32 c) { +inline constexpr bool IsAlphaNumeric(uc32 c) { return IsInRange(AsciiAlphaToLower(c), 'a', 'z') || IsDecimalDigit(c); } -inline bool IsDecimalDigit(uc32 c) { +inline constexpr bool IsDecimalDigit(uc32 c) { // ECMA-262, 3rd, 7.8.3 (p 16) return IsInRange(c, '0', '9'); } -inline bool IsHexDigit(uc32 c) { +inline constexpr bool IsHexDigit(uc32 c) { // ECMA-262, 3rd, 7.6 (p 15) return IsDecimalDigit(c) || IsInRange(AsciiAlphaToLower(c), 'a', 'f'); } -inline bool IsOctalDigit(uc32 c) { +inline constexpr bool IsOctalDigit(uc32 c) { // ECMA-262, 6th, 7.8.3 return IsInRange(c, '0', '7'); } -inline bool IsNonOctalDecimalDigit(uc32 c) { return IsInRange(c, '8', '9'); } +inline constexpr bool IsNonOctalDecimalDigit(uc32 c) { + return IsInRange(c, '8', '9'); +} -inline bool IsBinaryDigit(uc32 c) { +inline constexpr bool IsBinaryDigit(uc32 c) { // ECMA-262, 6th, 7.8.3 return c == '0' || c == '1'; } -inline bool IsRegExpWord(uc16 c) { +inline constexpr bool IsRegExpWord(uc16 c) { return IsInRange(AsciiAlphaToLower(c), 'a', 'z') || IsDecimalDigit(c) || (c == '_'); } +inline constexpr bool IsRegExpNewline(uc16 c) { + // CR LF LS PS + return c != 0x000A && c != 0x000D && c != 0x2028 && c != 0x2029; +} -inline bool IsRegExpNewline(uc16 c) { - switch (c) { - // CR LF LS PS - case 0x000A: case 0x000D: case 0x2028: case 0x2029: - return false; - default: - return true; - } +// Constexpr cache table for character flags. +enum AsciiCharFlags { + kIsIdentifierStart = 1 << 0, + kIsIdentifierPart = 1 << 1, + kIsWhiteSpace = 1 << 2, + kIsWhiteSpaceOrLineTerminator = 1 << 3 +}; +constexpr uint8_t BuildAsciiCharFlags(uc32 c) { + // clang-format off + return + (IsAsciiIdentifier(c) || c == '\\') ? ( + kIsIdentifierPart | (!IsDecimalDigit(c) ? kIsIdentifierStart : 0)) : 0 | + (c == ' ' || c == '\t' || c == '\v' || c == '\f') ? + kIsWhiteSpace | kIsWhiteSpaceOrLineTerminator : 0 | + (c == '\r' || c == '\n') ? kIsWhiteSpaceOrLineTerminator : 0; + // clang-format on +} +const constexpr uint8_t kAsciiCharFlags[128] = { +#define BUILD_CHAR_FLAGS(N) BuildAsciiCharFlags(N), + INT_0_TO_127_LIST(BUILD_CHAR_FLAGS) +#undef BUILD_CHAR_FLAGS +}; + +bool IsIdentifierStart(uc32 c) { + if (!IsInRange(c, 0, 127)) return IsIdentifierStartSlow(c); + DCHECK_EQ(IsIdentifierStartSlow(c), + static_cast<bool>(kAsciiCharFlags[c] & kIsIdentifierStart)); + return kAsciiCharFlags[c] & kIsIdentifierStart; } +bool IsIdentifierPart(uc32 c) { + if (!IsInRange(c, 0, 127)) return IsIdentifierPartSlow(c); + DCHECK_EQ(IsIdentifierPartSlow(c), + static_cast<bool>(kAsciiCharFlags[c] & kIsIdentifierPart)); + return kAsciiCharFlags[c] & kIsIdentifierPart; +} + +bool IsWhiteSpace(uc32 c) { + if (!IsInRange(c, 0, 127)) return IsWhiteSpaceSlow(c); + DCHECK_EQ(IsWhiteSpaceSlow(c), + static_cast<bool>(kAsciiCharFlags[c] & kIsWhiteSpace)); + return kAsciiCharFlags[c] & kIsWhiteSpace; +} + +bool IsWhiteSpaceOrLineTerminator(uc32 c) { + if (!IsInRange(c, 0, 127)) return IsWhiteSpaceOrLineTerminatorSlow(c); + DCHECK_EQ( + IsWhiteSpaceOrLineTerminatorSlow(c), + static_cast<bool>(kAsciiCharFlags[c] & kIsWhiteSpaceOrLineTerminator)); + return kAsciiCharFlags[c] & kIsWhiteSpaceOrLineTerminator; +} + +bool IsLineTerminatorSequence(uc32 c, uc32 next) { + if (!unibrow::IsLineTerminator(c)) return false; + if (c == 0x000d && next == 0x000a) return false; // CR with following LF. + return true; +} } // namespace internal } // namespace v8 |