/* | |
* Copyright (C) 2008 Apple Inc. All rights reserved. | |
* | |
* Redistribution and use in source and binary forms, with or without | |
* modification, are permitted provided that the following conditions | |
* are met: | |
* 1. Redistributions of source code must retain the above copyright | |
* notice, this list of conditions and the following disclaimer. | |
* 2. Redistributions in binary form must reproduce the above copyright | |
* notice, this list of conditions and the following disclaimer in the | |
* documentation and/or other materials provided with the distribution. | |
* | |
* THIS SOFTWARE IS PROVIDED BY APPLE INC. ``AS IS'' AND ANY | |
* EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE | |
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR | |
* PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL APPLE INC. OR | |
* CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, | |
* EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, | |
* PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR | |
* PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY | |
* OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT | |
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE | |
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. | |
*/ | |
#include "config.h" | |
#include "CharacterClass.h" | |
#if ENABLE(WREC) | |
using namespace WTF; | |
namespace JSC { namespace WREC { | |
const CharacterClass& CharacterClass::newline() { | |
static const UChar asciiNewlines[2] = { '\n', '\r' }; | |
static const UChar unicodeNewlines[2] = { 0x2028, 0x2029 }; | |
static const CharacterClass charClass = { | |
asciiNewlines, 2, | |
0, 0, | |
unicodeNewlines, 2, | |
0, 0, | |
}; | |
return charClass; | |
} | |
const CharacterClass& CharacterClass::digits() { | |
static const CharacterRange asciiDigitsRange[1] = { { '0', '9' } }; | |
static const CharacterClass charClass = { | |
0, 0, | |
asciiDigitsRange, 1, | |
0, 0, | |
0, 0, | |
}; | |
return charClass; | |
} | |
const CharacterClass& CharacterClass::spaces() { | |
static const UChar asciiSpaces[1] = { ' ' }; | |
static const CharacterRange asciiSpacesRange[1] = { { '\t', '\r' } }; | |
static const UChar unicodeSpaces[8] = { 0x00a0, 0x1680, 0x180e, 0x2028, 0x2029, 0x202f, 0x205f, 0x3000 }; | |
static const CharacterRange unicodeSpacesRange[1] = { { 0x2000, 0x200a } }; | |
static const CharacterClass charClass = { | |
asciiSpaces, 1, | |
asciiSpacesRange, 1, | |
unicodeSpaces, 8, | |
unicodeSpacesRange, 1, | |
}; | |
return charClass; | |
} | |
const CharacterClass& CharacterClass::wordchar() { | |
static const UChar asciiWordchar[1] = { '_' }; | |
static const CharacterRange asciiWordcharRange[3] = { { '0', '9' }, { 'A', 'Z' }, { 'a', 'z' } }; | |
static const CharacterClass charClass = { | |
asciiWordchar, 1, | |
asciiWordcharRange, 3, | |
0, 0, | |
0, 0, | |
}; | |
return charClass; | |
} | |
const CharacterClass& CharacterClass::nondigits() { | |
static const CharacterRange asciiNondigitsRange[2] = { { 0, '0' - 1 }, { '9' + 1, 0x7f } }; | |
static const CharacterRange unicodeNondigitsRange[1] = { { 0x0080, 0xffff } }; | |
static const CharacterClass charClass = { | |
0, 0, | |
asciiNondigitsRange, 2, | |
0, 0, | |
unicodeNondigitsRange, 1, | |
}; | |
return charClass; | |
} | |
const CharacterClass& CharacterClass::nonspaces() { | |
static const CharacterRange asciiNonspacesRange[3] = { { 0, '\t' - 1 }, { '\r' + 1, ' ' - 1 }, { ' ' + 1, 0x7f } }; | |
static const CharacterRange unicodeNonspacesRange[9] = { | |
{ 0x0080, 0x009f }, | |
{ 0x00a1, 0x167f }, | |
{ 0x1681, 0x180d }, | |
{ 0x180f, 0x1fff }, | |
{ 0x200b, 0x2027 }, | |
{ 0x202a, 0x202e }, | |
{ 0x2030, 0x205e }, | |
{ 0x2060, 0x2fff }, | |
{ 0x3001, 0xffff } | |
}; | |
static const CharacterClass charClass = { | |
0, 0, | |
asciiNonspacesRange, 3, | |
0, 0, | |
unicodeNonspacesRange, 9, | |
}; | |
return charClass; | |
} | |
const CharacterClass& CharacterClass::nonwordchar() { | |
static const UChar asciiNonwordchar[1] = { '`' }; | |
static const CharacterRange asciiNonwordcharRange[4] = { { 0, '0' - 1 }, { '9' + 1, 'A' - 1 }, { 'Z' + 1, '_' - 1 }, { 'z' + 1, 0x7f } }; | |
static const CharacterRange unicodeNonwordcharRange[1] = { { 0x0080, 0xffff } }; | |
static const CharacterClass charClass = { | |
asciiNonwordchar, 1, | |
asciiNonwordcharRange, 4, | |
0, 0, | |
unicodeNonwordcharRange, 1, | |
}; | |
return charClass; | |
} | |
} } // namespace JSC::WREC | |
#endif // ENABLE(WREC) |