| /* |
| * Copyright (C) 2006 George Staikos <staikos@kde.org> |
| * Copyright (C) 2006 Alexey Proskuryakov <ap@nypop.com> |
| * Copyright (C) 2007 Apple Computer, Inc. All rights reserved. |
| * Copyright (C) 2007-2009 Torch Mobile, Inc. |
| * |
| * This library is free software; you can redistribute it and/or |
| * modify it under the terms of the GNU Library General Public |
| * License as published by the Free Software Foundation; either |
| * version 2 of the License, or (at your option) any later version. |
| * |
| * This library is distributed in the hope that it will be useful, |
| * but WITHOUT ANY WARRANTY; without even the implied warranty of |
| * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU |
| * Library General Public License for more details. |
| * |
| * You should have received a copy of the GNU Library General Public License |
| * along with this library; see the file COPYING.LIB. If not, write to |
| * the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, |
| * Boston, MA 02110-1301, USA. |
| * |
| */ |
| |
| #ifndef UNICODE_WINCE_H |
| #define UNICODE_WINCE_H |
| |
| #include "ce_unicode.h" |
| |
| #define TO_MASK(x) (1 << (x)) |
| |
| // some defines from ICU needed one or two places |
| |
| #define U16_IS_LEAD(c) (((c) & 0xfffffc00) == 0xd800) |
| #define U16_IS_TRAIL(c) (((c) & 0xfffffc00) == 0xdc00) |
| #define U16_SURROGATE_OFFSET ((0xd800 << 10UL) + 0xdc00 - 0x10000) |
| #define U16_GET_SUPPLEMENTARY(lead, trail) \ |
| (((UChar32)(lead) << 10UL) + (UChar32)(trail) - U16_SURROGATE_OFFSET) |
| |
| #define U16_LEAD(supplementary) (UChar)(((supplementary) >> 10) + 0xd7c0) |
| #define U16_TRAIL(supplementary) (UChar)(((supplementary) & 0x3ff) | 0xdc00) |
| |
| #define U_IS_SURROGATE(c) (((c) & 0xfffff800) == 0xd800) |
| #define U16_IS_SURROGATE(c) U_IS_SURROGATE(c) |
| #define U16_IS_SURROGATE_LEAD(c) (((c) & 0x400) == 0) |
| |
| #define U16_NEXT(s, i, length, c) { \ |
| (c)=(s)[(i)++]; \ |
| if (U16_IS_LEAD(c)) { \ |
| uint16_t __c2; \ |
| if ((i) < (length) && U16_IS_TRAIL(__c2 = (s)[(i)])) { \ |
| ++(i); \ |
| (c) = U16_GET_SUPPLEMENTARY((c), __c2); \ |
| } \ |
| } \ |
| } |
| |
| #define U16_PREV(s, start, i, c) { \ |
| (c)=(s)[--(i)]; \ |
| if (U16_IS_TRAIL(c)) { \ |
| uint16_t __c2; \ |
| if ((i) > (start) && U16_IS_LEAD(__c2 = (s)[(i) - 1])) { \ |
| --(i); \ |
| (c) = U16_GET_SUPPLEMENTARY(__c2, (c)); \ |
| } \ |
| } \ |
| } |
| |
| #define U16_IS_SINGLE(c) !U_IS_SURROGATE(c) |
| |
| namespace WTF { |
| |
| namespace Unicode { |
| |
| enum Direction { |
| LeftToRight = UnicodeCE::U_LEFT_TO_RIGHT, |
| RightToLeft = UnicodeCE::U_RIGHT_TO_LEFT, |
| EuropeanNumber = UnicodeCE::U_EUROPEAN_NUMBER, |
| EuropeanNumberSeparator = UnicodeCE::U_EUROPEAN_NUMBER_SEPARATOR, |
| EuropeanNumberTerminator = UnicodeCE::U_EUROPEAN_NUMBER_TERMINATOR, |
| ArabicNumber = UnicodeCE::U_ARABIC_NUMBER, |
| CommonNumberSeparator = UnicodeCE::U_COMMON_NUMBER_SEPARATOR, |
| BlockSeparator = UnicodeCE::U_BLOCK_SEPARATOR, |
| SegmentSeparator = UnicodeCE::U_SEGMENT_SEPARATOR, |
| WhiteSpaceNeutral = UnicodeCE::U_WHITE_SPACE_NEUTRAL, |
| OtherNeutral = UnicodeCE::U_OTHER_NEUTRAL, |
| LeftToRightEmbedding = UnicodeCE::U_LEFT_TO_RIGHT_EMBEDDING, |
| LeftToRightOverride = UnicodeCE::U_LEFT_TO_RIGHT_OVERRIDE, |
| RightToLeftArabic = UnicodeCE::U_RIGHT_TO_LEFT_ARABIC, |
| RightToLeftEmbedding = UnicodeCE::U_RIGHT_TO_LEFT_EMBEDDING, |
| RightToLeftOverride = UnicodeCE::U_RIGHT_TO_LEFT_OVERRIDE, |
| PopDirectionalFormat = UnicodeCE::U_POP_DIRECTIONAL_FORMAT, |
| NonSpacingMark = UnicodeCE::U_DIR_NON_SPACING_MARK, |
| BoundaryNeutral = UnicodeCE::U_BOUNDARY_NEUTRAL |
| }; |
| |
| enum DecompositionType { |
| DecompositionNone = UnicodeCE::U_DT_NONE, |
| DecompositionCanonical = UnicodeCE::U_DT_CANONICAL, |
| DecompositionCompat = UnicodeCE::U_DT_COMPAT, |
| DecompositionCircle = UnicodeCE::U_DT_CIRCLE, |
| DecompositionFinal = UnicodeCE::U_DT_FINAL, |
| DecompositionFont = UnicodeCE::U_DT_FONT, |
| DecompositionFraction = UnicodeCE::U_DT_FRACTION, |
| DecompositionInitial = UnicodeCE::U_DT_INITIAL, |
| DecompositionIsolated = UnicodeCE::U_DT_ISOLATED, |
| DecompositionMedial = UnicodeCE::U_DT_MEDIAL, |
| DecompositionNarrow = UnicodeCE::U_DT_NARROW, |
| DecompositionNoBreak = UnicodeCE::U_DT_NOBREAK, |
| DecompositionSmall = UnicodeCE::U_DT_SMALL, |
| DecompositionSquare = UnicodeCE::U_DT_SQUARE, |
| DecompositionSub = UnicodeCE::U_DT_SUB, |
| DecompositionSuper = UnicodeCE::U_DT_SUPER, |
| DecompositionVertical = UnicodeCE::U_DT_VERTICAL, |
| DecompositionWide = UnicodeCE::U_DT_WIDE, |
| }; |
| |
| enum CharCategory { |
| NoCategory = 0, |
| Other_NotAssigned = TO_MASK(UnicodeCE::U_GENERAL_OTHER_TYPES), |
| Letter_Uppercase = TO_MASK(UnicodeCE::U_UPPERCASE_LETTER), |
| Letter_Lowercase = TO_MASK(UnicodeCE::U_LOWERCASE_LETTER), |
| Letter_Titlecase = TO_MASK(UnicodeCE::U_TITLECASE_LETTER), |
| Letter_Modifier = TO_MASK(UnicodeCE::U_MODIFIER_LETTER), |
| Letter_Other = TO_MASK(UnicodeCE::U_OTHER_LETTER), |
| |
| Mark_NonSpacing = TO_MASK(UnicodeCE::U_NON_SPACING_MARK), |
| Mark_Enclosing = TO_MASK(UnicodeCE::U_ENCLOSING_MARK), |
| Mark_SpacingCombining = TO_MASK(UnicodeCE::U_COMBINING_SPACING_MARK), |
| |
| Number_DecimalDigit = TO_MASK(UnicodeCE::U_DECIMAL_DIGIT_NUMBER), |
| Number_Letter = TO_MASK(UnicodeCE::U_LETTER_NUMBER), |
| Number_Other = TO_MASK(UnicodeCE::U_OTHER_NUMBER), |
| |
| Separator_Space = TO_MASK(UnicodeCE::U_SPACE_SEPARATOR), |
| Separator_Line = TO_MASK(UnicodeCE::U_LINE_SEPARATOR), |
| Separator_Paragraph = TO_MASK(UnicodeCE::U_PARAGRAPH_SEPARATOR), |
| |
| Other_Control = TO_MASK(UnicodeCE::U_CONTROL_CHAR), |
| Other_Format = TO_MASK(UnicodeCE::U_FORMAT_CHAR), |
| Other_PrivateUse = TO_MASK(UnicodeCE::U_PRIVATE_USE_CHAR), |
| Other_Surrogate = TO_MASK(UnicodeCE::U_SURROGATE), |
| |
| Punctuation_Dash = TO_MASK(UnicodeCE::U_DASH_PUNCTUATION), |
| Punctuation_Open = TO_MASK(UnicodeCE::U_START_PUNCTUATION), |
| Punctuation_Close = TO_MASK(UnicodeCE::U_END_PUNCTUATION), |
| Punctuation_Connector = TO_MASK(UnicodeCE::U_CONNECTOR_PUNCTUATION), |
| Punctuation_Other = TO_MASK(UnicodeCE::U_OTHER_PUNCTUATION), |
| |
| Symbol_Math = TO_MASK(UnicodeCE::U_MATH_SYMBOL), |
| Symbol_Currency = TO_MASK(UnicodeCE::U_CURRENCY_SYMBOL), |
| Symbol_Modifier = TO_MASK(UnicodeCE::U_MODIFIER_SYMBOL), |
| Symbol_Other = TO_MASK(UnicodeCE::U_OTHER_SYMBOL), |
| |
| Punctuation_InitialQuote = TO_MASK(UnicodeCE::U_INITIAL_PUNCTUATION), |
| Punctuation_FinalQuote = TO_MASK(UnicodeCE::U_FINAL_PUNCTUATION) |
| }; |
| |
| CharCategory category(unsigned int); |
| |
| bool isSpace(wchar_t); |
| bool isLetter(wchar_t); |
| bool isPrintableChar(wchar_t); |
| bool isUpper(wchar_t); |
| bool isLower(wchar_t); |
| bool isPunct(wchar_t); |
| bool isDigit(wchar_t); |
| inline bool isSeparatorSpace(wchar_t c) { return category(c) == Separator_Space; } |
| inline bool isHighSurrogate(wchar_t c) { return (c & 0xfc00) == 0xd800; } |
| inline bool isLowSurrogate(wchar_t c) { return (c & 0xfc00) == 0xdc00; } |
| |
| wchar_t toLower(wchar_t); |
| wchar_t toUpper(wchar_t); |
| wchar_t foldCase(wchar_t); |
| wchar_t toTitleCase(wchar_t); |
| int toLower(wchar_t* result, int resultLength, const wchar_t* source, int sourceLength, bool* isError); |
| int toUpper(wchar_t* result, int resultLength, const wchar_t* source, int sourceLength, bool* isError); |
| int foldCase(UChar* result, int resultLength, const wchar_t* source, int sourceLength, bool* isError); |
| |
| int digitValue(wchar_t); |
| |
| wchar_t mirroredChar(UChar32); |
| unsigned char combiningClass(UChar32); |
| DecompositionType decompositionType(UChar32); |
| Direction direction(UChar32); |
| inline bool isArabicChar(UChar32) |
| { |
| return false; // FIXME: implement! |
| } |
| |
| inline bool hasLineBreakingPropertyComplexContext(UChar32) |
| { |
| return false; // FIXME: implement! |
| } |
| |
| inline int umemcasecmp(const wchar_t* a, const wchar_t* b, int len) |
| { |
| for (int i = 0; i < len; ++i) { |
| wchar_t c1 = foldCase(a[i]); |
| wchar_t c2 = foldCase(b[i]); |
| if (c1 != c2) |
| return c1 - c2; |
| } |
| return 0; |
| } |
| |
| inline UChar32 surrogateToUcs4(wchar_t high, wchar_t low) |
| { |
| return (UChar32(high) << 10) + low - 0x35fdc00; |
| } |
| |
| } // namespace Unicode |
| |
| } // namespace WTF |
| |
| #endif |
| // vim: ts=2 sw=2 et |