diff options
Diffstat (limited to 'deps/v8/src/strings/char-predicates-inl.h')
-rw-r--r-- | deps/v8/src/strings/char-predicates-inl.h | 125 |
1 files changed, 125 insertions, 0 deletions
diff --git a/deps/v8/src/strings/char-predicates-inl.h b/deps/v8/src/strings/char-predicates-inl.h new file mode 100644 index 0000000000..cdd8ddb4ea --- /dev/null +++ b/deps/v8/src/strings/char-predicates-inl.h @@ -0,0 +1,125 @@ +// Copyright 2011 the V8 project authors. All rights reserved. +// Use of this source code is governed by a BSD-style license that can be +// found in the LICENSE file. + +#ifndef V8_STRINGS_CHAR_PREDICATES_INL_H_ +#define V8_STRINGS_CHAR_PREDICATES_INL_H_ + +#include "src/strings/char-predicates.h" + +namespace v8 { +namespace internal { + +// If c is in 'A'-'Z' or 'a'-'z', return its lower-case. +// Else, return something outside of 'A'-'Z' and 'a'-'z'. +// Note: it ignores LOCALE. +inline constexpr int AsciiAlphaToLower(uc32 c) { return c | 0x20; } + +inline constexpr bool IsCarriageReturn(uc32 c) { return c == 0x000D; } + +inline constexpr bool IsLineFeed(uc32 c) { return c == 0x000A; } + +inline constexpr bool IsAsciiIdentifier(uc32 c) { + return IsAlphaNumeric(c) || c == '$' || c == '_'; +} + +inline constexpr bool IsAlphaNumeric(uc32 c) { + return IsInRange(AsciiAlphaToLower(c), 'a', 'z') || IsDecimalDigit(c); +} + +inline constexpr bool IsDecimalDigit(uc32 c) { + // ECMA-262, 3rd, 7.8.3 (p 16) + return IsInRange(c, '0', '9'); +} + +inline constexpr bool IsHexDigit(uc32 c) { + // ECMA-262, 3rd, 7.6 (p 15) + return IsDecimalDigit(c) || IsInRange(AsciiAlphaToLower(c), 'a', 'f'); +} + +inline constexpr bool IsOctalDigit(uc32 c) { + // ECMA-262, 6th, 7.8.3 + return IsInRange(c, '0', '7'); +} + +inline constexpr bool IsNonOctalDecimalDigit(uc32 c) { + return IsInRange(c, '8', '9'); +} + +inline constexpr bool IsBinaryDigit(uc32 c) { + // ECMA-262, 6th, 7.8.3 + return c == '0' || c == '1'; +} + +inline constexpr bool IsRegExpWord(uc16 c) { + return IsInRange(AsciiAlphaToLower(c), 'a', 'z') || IsDecimalDigit(c) || + (c == '_'); +} + +inline constexpr bool IsRegExpNewline(uc16 c) { + // CR LF LS PS + return c != 0x000A && c != 0x000D && c != 0x2028 && c != 0x2029; +} + +// Constexpr cache table for character flags. +enum AsciiCharFlags { + kIsIdentifierStart = 1 << 0, + kIsIdentifierPart = 1 << 1, + kIsWhiteSpace = 1 << 2, + kIsWhiteSpaceOrLineTerminator = 1 << 3 +}; +constexpr uint8_t BuildAsciiCharFlags(uc32 c) { + // clang-format off + return + (IsAsciiIdentifier(c) || c == '\\') ? ( + kIsIdentifierPart | (!IsDecimalDigit(c) ? kIsIdentifierStart : 0)) : 0 | + (c == ' ' || c == '\t' || c == '\v' || c == '\f') ? + kIsWhiteSpace | kIsWhiteSpaceOrLineTerminator : 0 | + (c == '\r' || c == '\n') ? kIsWhiteSpaceOrLineTerminator : 0; + // clang-format on +} +const constexpr uint8_t kAsciiCharFlags[128] = { +#define BUILD_CHAR_FLAGS(N) BuildAsciiCharFlags(N), + INT_0_TO_127_LIST(BUILD_CHAR_FLAGS) +#undef BUILD_CHAR_FLAGS +}; + +bool IsIdentifierStart(uc32 c) { + if (!IsInRange(c, 0, 127)) return IsIdentifierStartSlow(c); + DCHECK_EQ(IsIdentifierStartSlow(c), + static_cast<bool>(kAsciiCharFlags[c] & kIsIdentifierStart)); + return kAsciiCharFlags[c] & kIsIdentifierStart; +} + +bool IsIdentifierPart(uc32 c) { + if (!IsInRange(c, 0, 127)) return IsIdentifierPartSlow(c); + DCHECK_EQ(IsIdentifierPartSlow(c), + static_cast<bool>(kAsciiCharFlags[c] & kIsIdentifierPart)); + return kAsciiCharFlags[c] & kIsIdentifierPart; +} + +bool IsWhiteSpace(uc32 c) { + if (!IsInRange(c, 0, 127)) return IsWhiteSpaceSlow(c); + DCHECK_EQ(IsWhiteSpaceSlow(c), + static_cast<bool>(kAsciiCharFlags[c] & kIsWhiteSpace)); + return kAsciiCharFlags[c] & kIsWhiteSpace; +} + +bool IsWhiteSpaceOrLineTerminator(uc32 c) { + if (!IsInRange(c, 0, 127)) return IsWhiteSpaceOrLineTerminatorSlow(c); + DCHECK_EQ( + IsWhiteSpaceOrLineTerminatorSlow(c), + static_cast<bool>(kAsciiCharFlags[c] & kIsWhiteSpaceOrLineTerminator)); + return kAsciiCharFlags[c] & kIsWhiteSpaceOrLineTerminator; +} + +bool IsLineTerminatorSequence(uc32 c, uc32 next) { + if (!unibrow::IsLineTerminator(c)) return false; + if (c == 0x000d && next == 0x000a) return false; // CR with following LF. + return true; +} + +} // namespace internal +} // namespace v8 + +#endif // V8_STRINGS_CHAR_PREDICATES_INL_H_ |