| /* |
| * Copyright (C) 2008 Apple Inc. All rights reserved. |
| * |
| * Redistribution and use in source and binary forms, with or without |
| * modification, are permitted provided that the following conditions |
| * are met: |
| * 1. Redistributions of source code must retain the above copyright |
| * notice, this list of conditions and the following disclaimer. |
| * 2. Redistributions in binary form must reproduce the above copyright |
| * notice, this list of conditions and the following disclaimer in the |
| * documentation and/or other materials provided with the distribution. |
| * |
| * THIS SOFTWARE IS PROVIDED BY APPLE INC. ``AS IS'' AND ANY |
| * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE |
| * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR |
| * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL APPLE INC. OR |
| * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, |
| * EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, |
| * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR |
| * PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY |
| * OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |
| * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE |
| * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
| */ |
| |
| #include "config.h" |
| #include "CharacterClass.h" |
| |
| #if ENABLE(WREC) |
| |
| using namespace WTF; |
| |
| namespace JSC { namespace WREC { |
| |
| const CharacterClass& CharacterClass::newline() { |
| static const UChar asciiNewlines[2] = { '\n', '\r' }; |
| static const UChar unicodeNewlines[2] = { 0x2028, 0x2029 }; |
| static const CharacterClass charClass = { |
| asciiNewlines, 2, |
| 0, 0, |
| unicodeNewlines, 2, |
| 0, 0, |
| }; |
| |
| return charClass; |
| } |
| |
| const CharacterClass& CharacterClass::digits() { |
| static const CharacterRange asciiDigitsRange[1] = { { '0', '9' } }; |
| static const CharacterClass charClass = { |
| 0, 0, |
| asciiDigitsRange, 1, |
| 0, 0, |
| 0, 0, |
| }; |
| |
| return charClass; |
| } |
| |
| const CharacterClass& CharacterClass::spaces() { |
| static const UChar asciiSpaces[1] = { ' ' }; |
| static const CharacterRange asciiSpacesRange[1] = { { '\t', '\r' } }; |
| static const UChar unicodeSpaces[8] = { 0x00a0, 0x1680, 0x180e, 0x2028, 0x2029, 0x202f, 0x205f, 0x3000 }; |
| static const CharacterRange unicodeSpacesRange[1] = { { 0x2000, 0x200a } }; |
| static const CharacterClass charClass = { |
| asciiSpaces, 1, |
| asciiSpacesRange, 1, |
| unicodeSpaces, 8, |
| unicodeSpacesRange, 1, |
| }; |
| |
| return charClass; |
| } |
| |
| const CharacterClass& CharacterClass::wordchar() { |
| static const UChar asciiWordchar[1] = { '_' }; |
| static const CharacterRange asciiWordcharRange[3] = { { '0', '9' }, { 'A', 'Z' }, { 'a', 'z' } }; |
| static const CharacterClass charClass = { |
| asciiWordchar, 1, |
| asciiWordcharRange, 3, |
| 0, 0, |
| 0, 0, |
| }; |
| |
| return charClass; |
| } |
| |
| const CharacterClass& CharacterClass::nondigits() { |
| static const CharacterRange asciiNondigitsRange[2] = { { 0, '0' - 1 }, { '9' + 1, 0x7f } }; |
| static const CharacterRange unicodeNondigitsRange[1] = { { 0x0080, 0xffff } }; |
| static const CharacterClass charClass = { |
| 0, 0, |
| asciiNondigitsRange, 2, |
| 0, 0, |
| unicodeNondigitsRange, 1, |
| }; |
| |
| return charClass; |
| } |
| |
| const CharacterClass& CharacterClass::nonspaces() { |
| static const CharacterRange asciiNonspacesRange[3] = { { 0, '\t' - 1 }, { '\r' + 1, ' ' - 1 }, { ' ' + 1, 0x7f } }; |
| static const CharacterRange unicodeNonspacesRange[9] = { |
| { 0x0080, 0x009f }, |
| { 0x00a1, 0x167f }, |
| { 0x1681, 0x180d }, |
| { 0x180f, 0x1fff }, |
| { 0x200b, 0x2027 }, |
| { 0x202a, 0x202e }, |
| { 0x2030, 0x205e }, |
| { 0x2060, 0x2fff }, |
| { 0x3001, 0xffff } |
| }; |
| static const CharacterClass charClass = { |
| 0, 0, |
| asciiNonspacesRange, 3, |
| 0, 0, |
| unicodeNonspacesRange, 9, |
| }; |
| |
| return charClass; |
| } |
| |
| const CharacterClass& CharacterClass::nonwordchar() { |
| static const UChar asciiNonwordchar[1] = { '`' }; |
| static const CharacterRange asciiNonwordcharRange[4] = { { 0, '0' - 1 }, { '9' + 1, 'A' - 1 }, { 'Z' + 1, '_' - 1 }, { 'z' + 1, 0x7f } }; |
| static const CharacterRange unicodeNonwordcharRange[1] = { { 0x0080, 0xffff } }; |
| static const CharacterClass charClass = { |
| asciiNonwordchar, 1, |
| asciiNonwordcharRange, 4, |
| 0, 0, |
| unicodeNonwordcharRange, 1, |
| }; |
| |
| return charClass; |
| } |
| |
| } } // namespace JSC::WREC |
| |
| #endif // ENABLE(WREC) |