blob: 962e7320ada071b886f3d7f1d65df4de59ab28a1 [file] [log] [blame]
/*
* Copyright (C) 2006 George Staikos <staikos@kde.org>
* Copyright (C) 2006 Alexey Proskuryakov <ap@nypop.com>
* Copyright (C) 2006, 2007, 2008, 2009 Apple Inc. All rights reserved.
*
* This library is free software; you can redistribute it and/or
* modify it under the terms of the GNU Library General Public
* License as published by the Free Software Foundation; either
* version 2 of the License, or (at your option) any later version.
*
* This library is distributed in the hope that it will be useful,
* but WITHOUT ANY WARRANTY; without even the implied warranty of
* MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
* Library General Public License for more details.
*
* You should have received a copy of the GNU Library General Public License
* along with this library; see the file COPYING.LIB. If not, write to
* the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor,
* Boston, MA 02110-1301, USA.
*
*/
#ifndef WTF_UNICODE_ICU_H
#define WTF_UNICODE_ICU_H
#include <stdlib.h>
#include <unicode/uchar.h>
#include <unicode/uscript.h>
#include <unicode/ustring.h>
#include <unicode/utf16.h>
namespace WTF {
namespace Unicode {
enum Direction {
LeftToRight = U_LEFT_TO_RIGHT,
RightToLeft = U_RIGHT_TO_LEFT,
EuropeanNumber = U_EUROPEAN_NUMBER,
EuropeanNumberSeparator = U_EUROPEAN_NUMBER_SEPARATOR,
EuropeanNumberTerminator = U_EUROPEAN_NUMBER_TERMINATOR,
ArabicNumber = U_ARABIC_NUMBER,
CommonNumberSeparator = U_COMMON_NUMBER_SEPARATOR,
BlockSeparator = U_BLOCK_SEPARATOR,
SegmentSeparator = U_SEGMENT_SEPARATOR,
WhiteSpaceNeutral = U_WHITE_SPACE_NEUTRAL,
OtherNeutral = U_OTHER_NEUTRAL,
LeftToRightEmbedding = U_LEFT_TO_RIGHT_EMBEDDING,
LeftToRightOverride = U_LEFT_TO_RIGHT_OVERRIDE,
RightToLeftArabic = U_RIGHT_TO_LEFT_ARABIC,
RightToLeftEmbedding = U_RIGHT_TO_LEFT_EMBEDDING,
RightToLeftOverride = U_RIGHT_TO_LEFT_OVERRIDE,
PopDirectionalFormat = U_POP_DIRECTIONAL_FORMAT,
NonSpacingMark = U_DIR_NON_SPACING_MARK,
BoundaryNeutral = U_BOUNDARY_NEUTRAL
};
enum DecompositionType {
DecompositionNone = U_DT_NONE,
DecompositionCanonical = U_DT_CANONICAL,
DecompositionCompat = U_DT_COMPAT,
DecompositionCircle = U_DT_CIRCLE,
DecompositionFinal = U_DT_FINAL,
DecompositionFont = U_DT_FONT,
DecompositionFraction = U_DT_FRACTION,
DecompositionInitial = U_DT_INITIAL,
DecompositionIsolated = U_DT_ISOLATED,
DecompositionMedial = U_DT_MEDIAL,
DecompositionNarrow = U_DT_NARROW,
DecompositionNoBreak = U_DT_NOBREAK,
DecompositionSmall = U_DT_SMALL,
DecompositionSquare = U_DT_SQUARE,
DecompositionSub = U_DT_SUB,
DecompositionSuper = U_DT_SUPER,
DecompositionVertical = U_DT_VERTICAL,
DecompositionWide = U_DT_WIDE,
};
enum CharCategory {
NoCategory = 0,
Other_NotAssigned = U_MASK(U_GENERAL_OTHER_TYPES),
Letter_Uppercase = U_MASK(U_UPPERCASE_LETTER),
Letter_Lowercase = U_MASK(U_LOWERCASE_LETTER),
Letter_Titlecase = U_MASK(U_TITLECASE_LETTER),
Letter_Modifier = U_MASK(U_MODIFIER_LETTER),
Letter_Other = U_MASK(U_OTHER_LETTER),
Mark_NonSpacing = U_MASK(U_NON_SPACING_MARK),
Mark_Enclosing = U_MASK(U_ENCLOSING_MARK),
Mark_SpacingCombining = U_MASK(U_COMBINING_SPACING_MARK),
Number_DecimalDigit = U_MASK(U_DECIMAL_DIGIT_NUMBER),
Number_Letter = U_MASK(U_LETTER_NUMBER),
Number_Other = U_MASK(U_OTHER_NUMBER),
Separator_Space = U_MASK(U_SPACE_SEPARATOR),
Separator_Line = U_MASK(U_LINE_SEPARATOR),
Separator_Paragraph = U_MASK(U_PARAGRAPH_SEPARATOR),
Other_Control = U_MASK(U_CONTROL_CHAR),
Other_Format = U_MASK(U_FORMAT_CHAR),
Other_PrivateUse = U_MASK(U_PRIVATE_USE_CHAR),
Other_Surrogate = U_MASK(U_SURROGATE),
Punctuation_Dash = U_MASK(U_DASH_PUNCTUATION),
Punctuation_Open = U_MASK(U_START_PUNCTUATION),
Punctuation_Close = U_MASK(U_END_PUNCTUATION),
Punctuation_Connector = U_MASK(U_CONNECTOR_PUNCTUATION),
Punctuation_Other = U_MASK(U_OTHER_PUNCTUATION),
Symbol_Math = U_MASK(U_MATH_SYMBOL),
Symbol_Currency = U_MASK(U_CURRENCY_SYMBOL),
Symbol_Modifier = U_MASK(U_MODIFIER_SYMBOL),
Symbol_Other = U_MASK(U_OTHER_SYMBOL),
Punctuation_InitialQuote = U_MASK(U_INITIAL_PUNCTUATION),
Punctuation_FinalQuote = U_MASK(U_FINAL_PUNCTUATION)
};
inline UChar32 foldCase(UChar32 c)
{
return u_foldCase(c, U_FOLD_CASE_DEFAULT);
}
inline int foldCase(UChar* result, int resultLength, const UChar* src, int srcLength, bool* error)
{
UErrorCode status = U_ZERO_ERROR;
int realLength = u_strFoldCase(result, resultLength, src, srcLength, U_FOLD_CASE_DEFAULT, &status);
*error = !U_SUCCESS(status);
return realLength;
}
inline int toLower(UChar* result, int resultLength, const UChar* src, int srcLength, bool* error)
{
UErrorCode status = U_ZERO_ERROR;
int realLength = u_strToLower(result, resultLength, src, srcLength, "", &status);
*error = !!U_FAILURE(status);
return realLength;
}
inline UChar32 toLower(UChar32 c)
{
return u_tolower(c);
}
inline UChar32 toUpper(UChar32 c)
{
return u_toupper(c);
}
inline int toUpper(UChar* result, int resultLength, const UChar* src, int srcLength, bool* error)
{
UErrorCode status = U_ZERO_ERROR;
int realLength = u_strToUpper(result, resultLength, src, srcLength, "", &status);
*error = !!U_FAILURE(status);
return realLength;
}
inline UChar32 toTitleCase(UChar32 c)
{
return u_totitle(c);
}
inline bool isArabicChar(UChar32 c)
{
return ublock_getCode(c) == UBLOCK_ARABIC;
}
inline bool isAlphanumeric(UChar32 c)
{
return u_isalnum(c);
}
inline bool isSeparatorSpace(UChar32 c)
{
return u_charType(c) == U_SPACE_SEPARATOR;
}
inline bool isPrintableChar(UChar32 c)
{
return !!u_isprint(c);
}
inline bool isPunct(UChar32 c)
{
return !!u_ispunct(c);
}
inline bool hasLineBreakingPropertyComplexContext(UChar32 c)
{
return u_getIntPropertyValue(c, UCHAR_LINE_BREAK) == U_LB_COMPLEX_CONTEXT;
}
inline UChar32 mirroredChar(UChar32 c)
{
return u_charMirror(c);
}
inline CharCategory category(UChar32 c)
{
return static_cast<CharCategory>(U_GET_GC_MASK(c));
}
inline Direction direction(UChar32 c)
{
return static_cast<Direction>(u_charDirection(c));
}
inline bool isLower(UChar32 c)
{
return !!u_islower(c);
}
inline uint8_t combiningClass(UChar32 c)
{
return u_getCombiningClass(c);
}
inline DecompositionType decompositionType(UChar32 c)
{
return static_cast<DecompositionType>(u_getIntPropertyValue(c, UCHAR_DECOMPOSITION_TYPE));
}
inline int umemcasecmp(const UChar* a, const UChar* b, int len)
{
return u_memcasecmp(a, b, len, U_FOLD_CASE_DEFAULT);
}
} }
#endif // WTF_UNICODE_ICU_H