blob: 3f27a8de5873b76f71e041b2ccb26ac41231e220 [file] [log] [blame]
/*
* Copyright (C) 2004 Apple Computer, Inc. All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY APPLE COMPUTER, INC. ``AS IS'' AND ANY
* EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
* PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL APPLE COMPUTER, INC. OR
* CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
* EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
* PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
* PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
* OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/
#ifndef KHTML_EDITING_VISIBLE_TEXT_H
#define KHTML_EDITING_VISIBLE_TEXT_H
#include "InlineTextBox.h"
#include "DeprecatedString.h"
#include "Range.h"
#include <kxmlcore/Vector.h>
namespace WebCore {
// FIXME: Can't really answer this question correctly without knowing the white-space mode.
// FIXME: Move this along with the white-space position functions above
// somewhere else in the editing directory. It doesn't belong here.
inline bool isCollapsibleWhitespace(const QChar& c)
{
switch (c.unicode()) {
case ' ':
case '\n':
return true;
default:
return false;
}
}
DeprecatedString plainText(const Range *);
PassRefPtr<Range> findPlainText(const Range *, const DeprecatedString &, bool forward, bool caseSensitive);
// Iterates through the DOM range, returning all the text, and 0-length boundaries
// at points where replaced elements break up the text flow. The text comes back in
// chunks so as to optimize for performance of the iteration.
enum IteratorKind { CONTENT = 0, RUNFINDER = 1 };
class TextIterator
{
public:
TextIterator();
explicit TextIterator(const Range *, IteratorKind kind = CONTENT );
bool atEnd() const { return !m_positionNode; }
void advance();
int length() const { return m_textLength; }
const QChar *characters() const { return m_textCharacters; }
PassRefPtr<Range> range() const;
static int rangeLength(const Range *r);
static PassRefPtr<Range> rangeFromLocationAndLength(Document *doc, int rangeLocation, int rangeLength);
private:
void exitNode();
bool handleTextNode();
bool handleReplacedElement();
bool handleNonTextNode();
void handleTextBox();
void emitCharacter(QChar, Node *textNode, Node *offsetBaseNode, int textStartOffset, int textEndOffset);
// Current position, not necessarily of the text being returned, but position
// as we walk through the DOM tree.
Node *m_node;
int m_offset;
bool m_handledNode;
bool m_handledChildren;
// End of the range.
Node *m_endContainer;
int m_endOffset;
Node *m_pastEndNode;
// The current text and its position, in the form to be returned from the iterator.
Node *m_positionNode;
mutable Node *m_positionOffsetBaseNode;
mutable int m_positionStartOffset;
mutable int m_positionEndOffset;
const QChar *m_textCharacters;
int m_textLength;
// Used when there is still some pending text from the current node; when these
// are false and 0, we go back to normal iterating.
bool m_needAnotherNewline;
InlineTextBox *m_textBox;
// Used to do the whitespace collapsing logic.
Node *m_lastTextNode;
bool m_lastTextNodeEndedWithCollapsedSpace;
QChar m_lastCharacter;
// Used for whitespace characters that aren't in the DOM, so we can point at them.
QChar m_singleCharacterBuffer;
// Used when text boxes are out of order (Hebrew/Arabic w/ embeded LTR text)
Vector<InlineTextBox*> m_sortedTextBoxes;
size_t m_sortedTextBoxesPosition;
};
// Iterates through the DOM range, returning all the text, and 0-length boundaries
// at points where replaced elements break up the text flow. The text comes back in
// chunks so as to optimize for performance of the iteration.
class SimplifiedBackwardsTextIterator
{
public:
SimplifiedBackwardsTextIterator();
explicit SimplifiedBackwardsTextIterator(const Range *);
bool atEnd() const { return !m_positionNode; }
void advance();
int length() const { return m_textLength; }
const QChar *characters() const { return m_textCharacters; }
PassRefPtr<Range> range() const;
private:
void exitNode();
bool handleTextNode();
bool handleReplacedElement();
bool handleNonTextNode();
void emitCharacter(QChar, Node *Node, int startOffset, int endOffset);
void emitNewlineForBROrText();
// Current position, not necessarily of the text being returned, but position
// as we walk through the DOM tree.
Node *m_node;
int m_offset;
bool m_handledNode;
bool m_handledChildren;
// End of the range.
Node *m_startNode;
int m_startOffset;
// The current text and its position, in the form to be returned from the iterator.
Node *m_positionNode;
int m_positionStartOffset;
int m_positionEndOffset;
const QChar *m_textCharacters;
int m_textLength;
// Used to do the whitespace logic.
Node *m_lastTextNode;
QChar m_lastCharacter;
// Used for whitespace characters that aren't in the DOM, so we can point at them.
QChar m_singleCharacterBuffer;
};
// Builds on the text iterator, adding a character position so we can walk one
// character at a time, or faster, as needed. Useful for searching.
class CharacterIterator {
public:
CharacterIterator();
explicit CharacterIterator(const Range *r);
void advance(int numCharacters);
bool atBreak() const { return m_atBreak; }
bool atEnd() const { return m_textIterator.atEnd(); }
int length() const { return m_textIterator.length() - m_runOffset; }
const QChar *characters() const { return m_textIterator.characters() + m_runOffset; }
DeprecatedString string(int numChars);
int characterOffset() const { return m_offset; }
PassRefPtr<Range> range() const;
private:
int m_offset;
int m_runOffset;
bool m_atBreak;
TextIterator m_textIterator;
};
// Very similar to the TextIterator, except that the chunks of text returned are "well behaved",
// meaning they never end split up a word. This is useful for spellcheck or (perhaps one day) searching.
class WordAwareIterator {
public:
WordAwareIterator();
explicit WordAwareIterator(const Range *r);
bool atEnd() const { return !m_didLookAhead && m_textIterator.atEnd(); }
void advance();
int length() const;
const QChar *characters() const;
// Range of the text we're currently returning
PassRefPtr<Range> range() const { return m_range; }
private:
// text from the previous chunk from the textIterator
const QChar *m_previousText;
int m_previousLength;
// many chunks from textIterator concatenated
DeprecatedString m_buffer;
// Did we have to look ahead in the textIterator to confirm the current chunk?
bool m_didLookAhead;
RefPtr<Range> m_range;
TextIterator m_textIterator;
};
}
#endif