blob: 6511c6a42e4a40c560744576f804945385228cc3 [file] [log] [blame]
// Copyright 2014 the V8 project authors. All rights reserved.
// Use of this source code is governed by a BSD-style license that can be
// found in the LICENSE file.
#include "src/strings/char-predicates.h"
#include "src/strings/char-predicates-inl.h"
#include "src/strings/unicode.h"
#include "testing/gtest/include/gtest/gtest.h"
namespace v8 {
namespace internal {
TEST(CharPredicatesTest, WhiteSpace) {
EXPECT_TRUE(IsWhiteSpace(0x0009));
EXPECT_TRUE(IsWhiteSpace(0x000B));
EXPECT_TRUE(IsWhiteSpace(0x000C));
EXPECT_TRUE(IsWhiteSpace(' '));
EXPECT_TRUE(IsWhiteSpace(0x00A0));
EXPECT_TRUE(IsWhiteSpace(0x1680));
EXPECT_TRUE(IsWhiteSpace(0x2000));
EXPECT_TRUE(IsWhiteSpace(0x2007));
EXPECT_TRUE(IsWhiteSpace(0x202F));
EXPECT_TRUE(IsWhiteSpace(0x205F));
EXPECT_TRUE(IsWhiteSpace(0x3000));
EXPECT_TRUE(IsWhiteSpace(0xFEFF));
EXPECT_FALSE(IsWhiteSpace(0x180E));
}
TEST(CharPredicatesTest, WhiteSpaceOrLineTerminator) {
EXPECT_TRUE(IsWhiteSpaceOrLineTerminator(0x0009));
EXPECT_TRUE(IsWhiteSpaceOrLineTerminator(0x000B));
EXPECT_TRUE(IsWhiteSpaceOrLineTerminator(0x000C));
EXPECT_TRUE(IsWhiteSpaceOrLineTerminator(' '));
EXPECT_TRUE(IsWhiteSpaceOrLineTerminator(0x00A0));
EXPECT_TRUE(IsWhiteSpaceOrLineTerminator(0x1680));
EXPECT_TRUE(IsWhiteSpaceOrLineTerminator(0x2000));
EXPECT_TRUE(IsWhiteSpaceOrLineTerminator(0x2007));
EXPECT_TRUE(IsWhiteSpaceOrLineTerminator(0x202F));
EXPECT_TRUE(IsWhiteSpaceOrLineTerminator(0x205F));
EXPECT_TRUE(IsWhiteSpaceOrLineTerminator(0xFEFF));
// Line terminators
EXPECT_TRUE(IsWhiteSpaceOrLineTerminator(0x000A));
EXPECT_TRUE(IsWhiteSpaceOrLineTerminator(0x000D));
EXPECT_TRUE(IsWhiteSpaceOrLineTerminator(0x2028));
EXPECT_TRUE(IsWhiteSpaceOrLineTerminator(0x2029));
EXPECT_FALSE(IsWhiteSpaceOrLineTerminator(0x180E));
}
TEST(CharPredicatesTest, IdentifierStart) {
EXPECT_TRUE(IsIdentifierStart('$'));
EXPECT_TRUE(IsIdentifierStart('_'));
EXPECT_TRUE(IsIdentifierStart('\\'));
// http://www.unicode.org/reports/tr31/
// curl http://www.unicode.org/Public/UCD/latest/ucd/PropList.txt |
// grep 'Other_ID_Start'
// Other_ID_Start
EXPECT_TRUE(IsIdentifierStart(0x1885));
EXPECT_TRUE(IsIdentifierStart(0x1886));
EXPECT_TRUE(IsIdentifierStart(0x2118));
EXPECT_TRUE(IsIdentifierStart(0x212E));
EXPECT_TRUE(IsIdentifierStart(0x309B));
EXPECT_TRUE(IsIdentifierStart(0x309C));
// Issue 2892:
// \u2E2F has the Pattern_Syntax property, excluding it from ID_Start.
EXPECT_FALSE(IsIdentifierStart(0x2E2F));
#ifdef V8_INTL_SUPPORT
// New in Unicode 8.0 (6,847 code points)
// [:ID_Start:] & [[:Age=8.0:] - [:Age=7.0:]]
EXPECT_TRUE(IsIdentifierStart(0x08B3));
EXPECT_TRUE(IsIdentifierStart(0x0AF9));
EXPECT_TRUE(IsIdentifierStart(0x13F8));
EXPECT_TRUE(IsIdentifierStart(0x9FCD));
EXPECT_TRUE(IsIdentifierStart(0xAB60));
EXPECT_TRUE(IsIdentifierStart(0x10CC0));
EXPECT_TRUE(IsIdentifierStart(0x108E0));
EXPECT_TRUE(IsIdentifierStart(0x2B820));
// New in Unicode 9.0 (7,177 code points)
// [:ID_Start:] & [[:Age=9.0:] - [:Age=8.0:]]
EXPECT_TRUE(IsIdentifierStart(0x1C80));
EXPECT_TRUE(IsIdentifierStart(0x104DB));
EXPECT_TRUE(IsIdentifierStart(0x1E922));
#endif
}
TEST(CharPredicatesTest, IdentifierPart) {
EXPECT_TRUE(IsIdentifierPart('$'));
EXPECT_TRUE(IsIdentifierPart('_'));
EXPECT_TRUE(IsIdentifierPart('\\'));
EXPECT_TRUE(IsIdentifierPart(0x200C));
EXPECT_TRUE(IsIdentifierPart(0x200D));
#ifdef V8_INTL_SUPPORT
// New in Unicode 8.0 (6,847 code points)
// [:ID_Start:] & [[:Age=8.0:] - [:Age=7.0:]]
EXPECT_TRUE(IsIdentifierPart(0x08B3));
EXPECT_TRUE(IsIdentifierPart(0x0AF9));
EXPECT_TRUE(IsIdentifierPart(0x13F8));
EXPECT_TRUE(IsIdentifierPart(0x9FCD));
EXPECT_TRUE(IsIdentifierPart(0xAB60));
EXPECT_TRUE(IsIdentifierPart(0x10CC0));
EXPECT_TRUE(IsIdentifierPart(0x108E0));
EXPECT_TRUE(IsIdentifierPart(0x2B820));
// [[:ID_Continue:]-[:ID_Start:]] & [[:Age=8.0:]-[:Age=7.0:]]
// 162 code points
EXPECT_TRUE(IsIdentifierPart(0x08E3));
EXPECT_TRUE(IsIdentifierPart(0xA69E));
EXPECT_TRUE(IsIdentifierPart(0x11730));
// New in Unicode 9.0 (7,177 code points)
// [:ID_Start:] & [[:Age=9.0:] - [:Age=8.0:]]
EXPECT_TRUE(IsIdentifierPart(0x1C80));
EXPECT_TRUE(IsIdentifierPart(0x104DB));
EXPECT_TRUE(IsIdentifierPart(0x1E922));
// [[:ID_Continue:]-[:ID_Start:]] & [[:Age=9.0:]-[:Age=8.0:]]
// 162 code points
EXPECT_TRUE(IsIdentifierPart(0x08D4));
EXPECT_TRUE(IsIdentifierPart(0x1DFB));
EXPECT_TRUE(IsIdentifierPart(0xA8C5));
EXPECT_TRUE(IsIdentifierPart(0x11450));
#endif
// http://www.unicode.org/reports/tr31/
// curl http://www.unicode.org/Public/UCD/latest/ucd/PropList.txt |
// grep 'Other_ID_(Continue|Start)'
// Other_ID_Start
EXPECT_TRUE(IsIdentifierPart(0x1885));
EXPECT_TRUE(IsIdentifierPart(0x1886));
EXPECT_TRUE(IsIdentifierPart(0x2118));
EXPECT_TRUE(IsIdentifierPart(0x212E));
EXPECT_TRUE(IsIdentifierPart(0x309B));
EXPECT_TRUE(IsIdentifierPart(0x309C));
// Other_ID_Continue
EXPECT_TRUE(IsIdentifierPart(0x00B7));
EXPECT_TRUE(IsIdentifierPart(0x0387));
EXPECT_TRUE(IsIdentifierPart(0x1369));
EXPECT_TRUE(IsIdentifierPart(0x1370));
EXPECT_TRUE(IsIdentifierPart(0x1371));
EXPECT_TRUE(IsIdentifierPart(0x19DA));
// Issue 2892:
// \u2E2F has the Pattern_Syntax property, excluding it from ID_Start.
EXPECT_FALSE(IsIdentifierPart(0x2E2F));
}
#ifdef V8_INTL_SUPPORT
TEST(CharPredicatesTest, SupplementaryPlaneIdentifiers) {
// Both ID_Start and ID_Continue.
EXPECT_TRUE(IsIdentifierStart(0x10403)); // Category Lu
EXPECT_TRUE(IsIdentifierPart(0x10403));
EXPECT_TRUE(IsIdentifierStart(0x1043C)); // Category Ll
EXPECT_TRUE(IsIdentifierPart(0x1043C));
EXPECT_TRUE(IsIdentifierStart(0x16F9C)); // Category Lm
EXPECT_TRUE(IsIdentifierPart(0x16F9C));
EXPECT_TRUE(IsIdentifierStart(0x10048)); // Category Lo
EXPECT_TRUE(IsIdentifierPart(0x10048));
EXPECT_TRUE(IsIdentifierStart(0x1014D)); // Category Nl
EXPECT_TRUE(IsIdentifierPart(0x1014D));
// New in Unicode 8.0
// [ [:ID_Start=Yes:] & [:Age=8.0:]] - [:Age=7.0:]
EXPECT_TRUE(IsIdentifierStart(0x108E0));
EXPECT_TRUE(IsIdentifierStart(0x10C80));
// Only ID_Continue.
EXPECT_FALSE(IsIdentifierStart(0x101FD)); // Category Mn
EXPECT_TRUE(IsIdentifierPart(0x101FD));
EXPECT_FALSE(IsIdentifierStart(0x11002)); // Category Mc
EXPECT_TRUE(IsIdentifierPart(0x11002));
EXPECT_FALSE(IsIdentifierStart(0x104A9)); // Category Nd
EXPECT_TRUE(IsIdentifierPart(0x104A9));
// Neither.
EXPECT_FALSE(IsIdentifierStart(0x10111)); // Category No
EXPECT_FALSE(IsIdentifierPart(0x10111));
EXPECT_FALSE(IsIdentifierStart(0x1F4A9)); // Category So
EXPECT_FALSE(IsIdentifierPart(0x1F4A9));
}
#endif // V8_INTL_SUPPORT
} // namespace internal
} // namespace v8