4aeb94a42d
Use ICU to check ID_Start, ID_Continue and WhiteSpace even for BMP when V8_INTL_SUPPORT is on (which is default). Change LineTerminator::Is() to check 4 code points from ES#sec-line-terminators instead of using tables and Lookup function. Remove Lowercase::Is(). It's not used anywhere. Update webkit/{ToNumber,parseFloat}.js to have the correct expectation for U+180E and the corresponding expected files. This is a follow-up to an earlier change ( https://codereview.chromium.org/2720953003 ). CQ_INCLUDE_TRYBOTS=master.tryserver.v8:v8_win_dbg,v8_mac_dbg;master.tryserver.chromium.android:android_arm64_dbg_recipe CQ_INCLUDE_TRYBOTS=master.tryserver.v8:v8_linux_noi18n_rel_ng BUG=v8:5370,v8:5155 TEST=unittests --gtest_filter=CharP* TEST=webkit: ToNumber, parseFloat TEST=test262: built-ins/Number/S9.3*, built-ins/parse{Int,Float}/S15* TEST=test262: language/white-space/mong* TEST=test262: built-ins/String/prototype/trim/u180e TEST=mjsunit: whitespaces Review-Url: https://codereview.chromium.org/2331303002 Cr-Commit-Position: refs/heads/master@{#45957}
91 lines
2.7 KiB
C++
91 lines
2.7 KiB
C++
// Copyright 2011 the V8 project authors. All rights reserved.
|
|
// Use of this source code is governed by a BSD-style license that can be
|
|
// found in the LICENSE file.
|
|
|
|
#ifndef V8_CHAR_PREDICATES_H_
|
|
#define V8_CHAR_PREDICATES_H_
|
|
|
|
#include "src/globals.h"
|
|
#include "src/unicode.h"
|
|
|
|
namespace v8 {
|
|
namespace internal {
|
|
|
|
// Unicode character predicates as defined by ECMA-262, 3rd,
|
|
// used for lexical analysis.
|
|
|
|
inline int AsciiAlphaToLower(uc32 c);
|
|
inline bool IsCarriageReturn(uc32 c);
|
|
inline bool IsLineFeed(uc32 c);
|
|
inline bool IsAsciiIdentifier(uc32 c);
|
|
inline bool IsAlphaNumeric(uc32 c);
|
|
inline bool IsDecimalDigit(uc32 c);
|
|
inline bool IsHexDigit(uc32 c);
|
|
inline bool IsOctalDigit(uc32 c);
|
|
inline bool IsBinaryDigit(uc32 c);
|
|
inline bool IsRegExpWord(uc32 c);
|
|
inline bool IsRegExpNewline(uc32 c);
|
|
|
|
// ES#sec-names-and-keywords
|
|
// This includes '_', '$' and '\', and ID_Start according to
|
|
// http://www.unicode.org/reports/tr31/, which consists of categories
|
|
// 'Lu', 'Ll', 'Lt', 'Lm', 'Lo', 'Nl', but excluding properties
|
|
// 'Pattern_Syntax' or 'Pattern_White_Space'.
|
|
#ifdef V8_INTL_SUPPORT
|
|
struct V8_EXPORT_PRIVATE IdentifierStart {
|
|
static bool Is(uc32 c);
|
|
#else
|
|
struct IdentifierStart {
|
|
// Non-BMP characters are not supported without I18N.
|
|
static inline bool Is(uc32 c) {
|
|
return (c <= 0xFFFF) ? unibrow::ID_Start::Is(c) : false;
|
|
}
|
|
#endif
|
|
};
|
|
|
|
// ES#sec-names-and-keywords
|
|
// This includes \u200c and \u200d, and ID_Continue according to
|
|
// http://www.unicode.org/reports/tr31/, which consists of ID_Start,
|
|
// the categories 'Mn', 'Mc', 'Nd', 'Pc', but excluding properties
|
|
// 'Pattern_Syntax' or 'Pattern_White_Space'.
|
|
#ifdef V8_INTL_SUPPORT
|
|
struct V8_EXPORT_PRIVATE IdentifierPart {
|
|
static bool Is(uc32 c);
|
|
#else
|
|
struct IdentifierPart {
|
|
static inline bool Is(uc32 c) {
|
|
// Non-BMP charaacters are not supported without I18N.
|
|
if (c <= 0xFFFF) {
|
|
return unibrow::ID_Start::Is(c) || unibrow::ID_Continue::Is(c);
|
|
}
|
|
return false;
|
|
}
|
|
#endif
|
|
};
|
|
|
|
// ES6 draft section 11.2
|
|
// This includes all code points of Unicode category 'Zs'.
|
|
// Further included are \u0009, \u000b, \u000c, and \ufeff.
|
|
#ifdef V8_INTL_SUPPORT
|
|
struct V8_EXPORT_PRIVATE WhiteSpace {
|
|
static bool Is(uc32 c);
|
|
#else
|
|
struct WhiteSpace {
|
|
static inline bool Is(uc32 c) { return unibrow::WhiteSpace::Is(c); }
|
|
#endif
|
|
};
|
|
|
|
// WhiteSpace and LineTerminator according to ES6 draft section 11.2 and 11.3
|
|
// This includes all the characters with Unicode category 'Z' (= Zs+Zl+Zp)
|
|
// as well as \u0009 - \u000d and \ufeff.
|
|
struct WhiteSpaceOrLineTerminator {
|
|
static inline bool Is(uc32 c) {
|
|
return WhiteSpace::Is(c) || unibrow::LineTerminator::Is(c);
|
|
}
|
|
};
|
|
|
|
} // namespace internal
|
|
} // namespace v8
|
|
|
|
#endif // V8_CHAR_PREDICATES_H_
|