| // Copyright 2014 the V8 project authors. All rights reserved. |
| // Use of this source code is governed by a BSD-style license that can be |
| // found in the LICENSE file. |
| |
| #include "src/strings/char-predicates.h" |
| #include "src/strings/char-predicates-inl.h" |
| #include "src/strings/unicode.h" |
| #include "testing/gtest/include/gtest/gtest.h" |
| |
| namespace v8 { |
| namespace internal { |
| |
| TEST(CharPredicatesTest, WhiteSpace) { |
| EXPECT_TRUE(IsWhiteSpace(0x0009)); |
| EXPECT_TRUE(IsWhiteSpace(0x000B)); |
| EXPECT_TRUE(IsWhiteSpace(0x000C)); |
| EXPECT_TRUE(IsWhiteSpace(' ')); |
| EXPECT_TRUE(IsWhiteSpace(0x00A0)); |
| EXPECT_TRUE(IsWhiteSpace(0x1680)); |
| EXPECT_TRUE(IsWhiteSpace(0x2000)); |
| EXPECT_TRUE(IsWhiteSpace(0x2007)); |
| EXPECT_TRUE(IsWhiteSpace(0x202F)); |
| EXPECT_TRUE(IsWhiteSpace(0x205F)); |
| EXPECT_TRUE(IsWhiteSpace(0x3000)); |
| EXPECT_TRUE(IsWhiteSpace(0xFEFF)); |
| EXPECT_FALSE(IsWhiteSpace(0x180E)); |
| } |
| |
| TEST(CharPredicatesTest, WhiteSpaceOrLineTerminator) { |
| EXPECT_TRUE(IsWhiteSpaceOrLineTerminator(0x0009)); |
| EXPECT_TRUE(IsWhiteSpaceOrLineTerminator(0x000B)); |
| EXPECT_TRUE(IsWhiteSpaceOrLineTerminator(0x000C)); |
| EXPECT_TRUE(IsWhiteSpaceOrLineTerminator(' ')); |
| EXPECT_TRUE(IsWhiteSpaceOrLineTerminator(0x00A0)); |
| EXPECT_TRUE(IsWhiteSpaceOrLineTerminator(0x1680)); |
| EXPECT_TRUE(IsWhiteSpaceOrLineTerminator(0x2000)); |
| EXPECT_TRUE(IsWhiteSpaceOrLineTerminator(0x2007)); |
| EXPECT_TRUE(IsWhiteSpaceOrLineTerminator(0x202F)); |
| EXPECT_TRUE(IsWhiteSpaceOrLineTerminator(0x205F)); |
| EXPECT_TRUE(IsWhiteSpaceOrLineTerminator(0xFEFF)); |
| // Line terminators |
| EXPECT_TRUE(IsWhiteSpaceOrLineTerminator(0x000A)); |
| EXPECT_TRUE(IsWhiteSpaceOrLineTerminator(0x000D)); |
| EXPECT_TRUE(IsWhiteSpaceOrLineTerminator(0x2028)); |
| EXPECT_TRUE(IsWhiteSpaceOrLineTerminator(0x2029)); |
| EXPECT_FALSE(IsWhiteSpaceOrLineTerminator(0x180E)); |
| } |
| |
| TEST(CharPredicatesTest, IdentifierStart) { |
| EXPECT_TRUE(IsIdentifierStart('$')); |
| EXPECT_TRUE(IsIdentifierStart('_')); |
| EXPECT_TRUE(IsIdentifierStart('\\')); |
| |
| // http://www.unicode.org/reports/tr31/ |
| // curl http://www.unicode.org/Public/UCD/latest/ucd/PropList.txt | |
| // grep 'Other_ID_Start' |
| // Other_ID_Start |
| EXPECT_TRUE(IsIdentifierStart(0x1885)); |
| EXPECT_TRUE(IsIdentifierStart(0x1886)); |
| EXPECT_TRUE(IsIdentifierStart(0x2118)); |
| EXPECT_TRUE(IsIdentifierStart(0x212E)); |
| EXPECT_TRUE(IsIdentifierStart(0x309B)); |
| EXPECT_TRUE(IsIdentifierStart(0x309C)); |
| |
| // Issue 2892: |
| // \u2E2F has the Pattern_Syntax property, excluding it from ID_Start. |
| EXPECT_FALSE(IsIdentifierStart(0x2E2F)); |
| |
| #ifdef V8_INTL_SUPPORT |
| // New in Unicode 8.0 (6,847 code points) |
| // [:ID_Start:] & [[:Age=8.0:] - [:Age=7.0:]] |
| EXPECT_TRUE(IsIdentifierStart(0x08B3)); |
| EXPECT_TRUE(IsIdentifierStart(0x0AF9)); |
| EXPECT_TRUE(IsIdentifierStart(0x13F8)); |
| EXPECT_TRUE(IsIdentifierStart(0x9FCD)); |
| EXPECT_TRUE(IsIdentifierStart(0xAB60)); |
| EXPECT_TRUE(IsIdentifierStart(0x10CC0)); |
| EXPECT_TRUE(IsIdentifierStart(0x108E0)); |
| EXPECT_TRUE(IsIdentifierStart(0x2B820)); |
| |
| // New in Unicode 9.0 (7,177 code points) |
| // [:ID_Start:] & [[:Age=9.0:] - [:Age=8.0:]] |
| |
| EXPECT_TRUE(IsIdentifierStart(0x1C80)); |
| EXPECT_TRUE(IsIdentifierStart(0x104DB)); |
| EXPECT_TRUE(IsIdentifierStart(0x1E922)); |
| #endif |
| } |
| |
| TEST(CharPredicatesTest, IdentifierPart) { |
| EXPECT_TRUE(IsIdentifierPart('$')); |
| EXPECT_TRUE(IsIdentifierPart('_')); |
| EXPECT_TRUE(IsIdentifierPart('\\')); |
| EXPECT_TRUE(IsIdentifierPart(0x200C)); |
| EXPECT_TRUE(IsIdentifierPart(0x200D)); |
| |
| #ifdef V8_INTL_SUPPORT |
| // New in Unicode 8.0 (6,847 code points) |
| // [:ID_Start:] & [[:Age=8.0:] - [:Age=7.0:]] |
| EXPECT_TRUE(IsIdentifierPart(0x08B3)); |
| EXPECT_TRUE(IsIdentifierPart(0x0AF9)); |
| EXPECT_TRUE(IsIdentifierPart(0x13F8)); |
| EXPECT_TRUE(IsIdentifierPart(0x9FCD)); |
| EXPECT_TRUE(IsIdentifierPart(0xAB60)); |
| EXPECT_TRUE(IsIdentifierPart(0x10CC0)); |
| EXPECT_TRUE(IsIdentifierPart(0x108E0)); |
| EXPECT_TRUE(IsIdentifierPart(0x2B820)); |
| |
| // [[:ID_Continue:]-[:ID_Start:]] & [[:Age=8.0:]-[:Age=7.0:]] |
| // 162 code points |
| EXPECT_TRUE(IsIdentifierPart(0x08E3)); |
| EXPECT_TRUE(IsIdentifierPart(0xA69E)); |
| EXPECT_TRUE(IsIdentifierPart(0x11730)); |
| |
| // New in Unicode 9.0 (7,177 code points) |
| // [:ID_Start:] & [[:Age=9.0:] - [:Age=8.0:]] |
| EXPECT_TRUE(IsIdentifierPart(0x1C80)); |
| EXPECT_TRUE(IsIdentifierPart(0x104DB)); |
| EXPECT_TRUE(IsIdentifierPart(0x1E922)); |
| |
| // [[:ID_Continue:]-[:ID_Start:]] & [[:Age=9.0:]-[:Age=8.0:]] |
| // 162 code points |
| EXPECT_TRUE(IsIdentifierPart(0x08D4)); |
| EXPECT_TRUE(IsIdentifierPart(0x1DFB)); |
| EXPECT_TRUE(IsIdentifierPart(0xA8C5)); |
| EXPECT_TRUE(IsIdentifierPart(0x11450)); |
| #endif |
| |
| // http://www.unicode.org/reports/tr31/ |
| // curl http://www.unicode.org/Public/UCD/latest/ucd/PropList.txt | |
| // grep 'Other_ID_(Continue|Start)' |
| |
| // Other_ID_Start |
| EXPECT_TRUE(IsIdentifierPart(0x1885)); |
| EXPECT_TRUE(IsIdentifierPart(0x1886)); |
| EXPECT_TRUE(IsIdentifierPart(0x2118)); |
| EXPECT_TRUE(IsIdentifierPart(0x212E)); |
| EXPECT_TRUE(IsIdentifierPart(0x309B)); |
| EXPECT_TRUE(IsIdentifierPart(0x309C)); |
| |
| // Other_ID_Continue |
| EXPECT_TRUE(IsIdentifierPart(0x00B7)); |
| EXPECT_TRUE(IsIdentifierPart(0x0387)); |
| EXPECT_TRUE(IsIdentifierPart(0x1369)); |
| EXPECT_TRUE(IsIdentifierPart(0x1370)); |
| EXPECT_TRUE(IsIdentifierPart(0x1371)); |
| EXPECT_TRUE(IsIdentifierPart(0x19DA)); |
| |
| // Issue 2892: |
| // \u2E2F has the Pattern_Syntax property, excluding it from ID_Start. |
| EXPECT_FALSE(IsIdentifierPart(0x2E2F)); |
| } |
| |
| #ifdef V8_INTL_SUPPORT |
| TEST(CharPredicatesTest, SupplementaryPlaneIdentifiers) { |
| // Both ID_Start and ID_Continue. |
| EXPECT_TRUE(IsIdentifierStart(0x10403)); // Category Lu |
| EXPECT_TRUE(IsIdentifierPart(0x10403)); |
| EXPECT_TRUE(IsIdentifierStart(0x1043C)); // Category Ll |
| EXPECT_TRUE(IsIdentifierPart(0x1043C)); |
| EXPECT_TRUE(IsIdentifierStart(0x16F9C)); // Category Lm |
| EXPECT_TRUE(IsIdentifierPart(0x16F9C)); |
| EXPECT_TRUE(IsIdentifierStart(0x10048)); // Category Lo |
| EXPECT_TRUE(IsIdentifierPart(0x10048)); |
| EXPECT_TRUE(IsIdentifierStart(0x1014D)); // Category Nl |
| EXPECT_TRUE(IsIdentifierPart(0x1014D)); |
| |
| // New in Unicode 8.0 |
| // [ [:ID_Start=Yes:] & [:Age=8.0:]] - [:Age=7.0:] |
| EXPECT_TRUE(IsIdentifierStart(0x108E0)); |
| EXPECT_TRUE(IsIdentifierStart(0x10C80)); |
| |
| // Only ID_Continue. |
| EXPECT_FALSE(IsIdentifierStart(0x101FD)); // Category Mn |
| EXPECT_TRUE(IsIdentifierPart(0x101FD)); |
| EXPECT_FALSE(IsIdentifierStart(0x11002)); // Category Mc |
| EXPECT_TRUE(IsIdentifierPart(0x11002)); |
| EXPECT_FALSE(IsIdentifierStart(0x104A9)); // Category Nd |
| EXPECT_TRUE(IsIdentifierPart(0x104A9)); |
| |
| // Neither. |
| EXPECT_FALSE(IsIdentifierStart(0x10111)); // Category No |
| EXPECT_FALSE(IsIdentifierPart(0x10111)); |
| EXPECT_FALSE(IsIdentifierStart(0x1F4A9)); // Category So |
| EXPECT_FALSE(IsIdentifierPart(0x1F4A9)); |
| } |
| #endif // V8_INTL_SUPPORT |
| |
| } // namespace internal |
| } // namespace v8 |