| /* |
| * Copyright (C) 2008 Apple Inc. All rights reserved. |
| * |
| * Redistribution and use in source and binary forms, with or without |
| * modification, are permitted provided that the following conditions |
| * are met: |
| * 1. Redistributions of source code must retain the above copyright |
| * notice, this list of conditions and the following disclaimer. |
| * 2. Redistributions in binary form must reproduce the above copyright |
| * notice, this list of conditions and the following disclaimer in the |
| * documentation and/or other materials provided with the distribution. |
| * |
| * THIS SOFTWARE IS PROVIDED BY APPLE INC. ``AS IS'' AND ANY |
| * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE |
| * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR |
| * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL APPLE INC. OR |
| * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, |
| * EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, |
| * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR |
| * PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY |
| * OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT |
| * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE |
| * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. |
| */ |
| |
| #ifndef CharacterClassConstructor_h |
| #define CharacterClassConstructor_h |
| |
| #include <wtf/Platform.h> |
| |
| #if ENABLE(WREC) |
| |
| #include "CharacterClass.h" |
| #include <wtf/AlwaysInline.h> |
| #include <wtf/Vector.h> |
| #include <wtf/unicode/Unicode.h> |
| |
| namespace JSC { namespace WREC { |
| |
| class CharacterClassConstructor { |
| public: |
| CharacterClassConstructor(bool isCaseInsensitive) |
| : m_charBuffer(-1) |
| , m_isPendingDash(false) |
| , m_isCaseInsensitive(isCaseInsensitive) |
| , m_isUpsideDown(false) |
| { |
| } |
| |
| void flush(); |
| |
| // We need to flush prior to an escaped hyphen to prevent it as being treated as indicating |
| // a range, e.g. [a\-c] we flush prior to adding the hyphen so that this is not treated as |
| // [a-c]. However, we do not want to flush if we have already seen a non escaped hyphen - |
| // e.g. [+-\-] should be treated the same as [+--], producing a range that will also match |
| // a comma. |
| void flushBeforeEscapedHyphen() |
| { |
| if (!m_isPendingDash) |
| flush(); |
| } |
| |
| void put(UChar ch); |
| void append(const CharacterClass& other); |
| |
| bool isUpsideDown() { return m_isUpsideDown; } |
| |
| ALWAYS_INLINE CharacterClass charClass() |
| { |
| CharacterClass newCharClass = { |
| m_matches.begin(), m_matches.size(), |
| m_ranges.begin(), m_ranges.size(), |
| m_matchesUnicode.begin(), m_matchesUnicode.size(), |
| m_rangesUnicode.begin(), m_rangesUnicode.size(), |
| }; |
| |
| return newCharClass; |
| } |
| |
| private: |
| void addSorted(Vector<UChar>& matches, UChar ch); |
| void addSortedRange(Vector<CharacterRange>& ranges, UChar lo, UChar hi); |
| |
| int m_charBuffer; |
| bool m_isPendingDash; |
| bool m_isCaseInsensitive; |
| bool m_isUpsideDown; |
| |
| Vector<UChar> m_matches; |
| Vector<CharacterRange> m_ranges; |
| Vector<UChar> m_matchesUnicode; |
| Vector<CharacterRange> m_rangesUnicode; |
| }; |
| |
| } } // namespace JSC::WREC |
| |
| #endif // ENABLE(WREC) |
| |
| #endif // CharacterClassConstructor_h |