blob: 73d1c3f2c6bfd381bfb93a1ab45e3d7ddd4767ae [file] [log] [blame]
/*
* Copyright (C) 2004, 2008 Apple Inc. All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, are permitted provided that the following conditions
* are met:
* 1. Redistributions of source code must retain the above copyright
* notice, this list of conditions and the following disclaimer.
* 2. Redistributions in binary form must reproduce the above copyright
* notice, this list of conditions and the following disclaimer in the
* documentation and/or other materials provided with the distribution.
*
* THIS SOFTWARE IS PROVIDED BY APPLE INC. ``AS IS'' AND ANY
* EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
* IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
* PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL APPLE INC. OR
* CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
* EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
* PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
* PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
* OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
* (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
* OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
*/
#include "config.h"
#include "HTMLInterchange.h"
#include "Editing.h"
#include "RenderText.h"
#include "Text.h"
#include <wtf/text/StringBuilder.h>
#include <wtf/unicode/CharacterNames.h>
namespace WebCore {
// Returns a copy of |in| in which every run of collapsible whitespace (as
// reported by deprecatedIsCollapsibleWhitespace()) is rewritten as a mix of
// plain spaces and AppleConvertedSpace spans wrapping a non-breaking space.
// If |node| has a renderer whose style preserves newlines, |in| is returned
// unmodified. |node| is dereferenced unconditionally, so it must not be null.
String convertHTMLTextToInterchangeFormat(const String& in, const Text* node)
{
    // All of the text is assumed to originate from |node|.
    const bool keepTextVerbatim = node->renderer() && node->renderer()->style().preserveNewline();
    if (keepTextVerbatim)
        return in;

    const char convertedSpaceString[] = "<span class=\"" AppleConvertedSpace "\">\xA0</span>";
    // The \xA0 byte embedded in the span above has to be the non-breaking space character.
    COMPILE_ASSERT((static_cast<unsigned char>('\xA0') == noBreakSpace), ConvertedSpaceStringSpaceIsNoBreakSpace);

    const unsigned length = in.length();
    StringBuilder result;

    for (unsigned position = 0; position < length;) {
        // Anything that is not collapsible whitespace is copied through as-is.
        if (!deprecatedIsCollapsibleWhitespace(in[position])) {
            result.append(in[position]);
            ++position;
            continue;
        }

        // Locate the end of the whitespace run that begins at |position|.
        unsigned runEnd = position + 1;
        while (runEnd < length && deprecatedIsCollapsibleWhitespace(in[runEnd]))
            ++runEnd;
        const unsigned runLength = runEnd - position;

        // The run is emitted as an optional leading group of one or two
        // characters (the remainder modulo three) followed by whole groups of
        // three. Only the leading group depends on where the run sits in the string.
        const bool runStartsString = !position;
        switch (runLength % 3) {
        case 1: {
            // A lone leftover space stays a plain space unless the run begins
            // the string or is its final character.
            const bool isFinalCharacter = position + 1 == length;
            if (runStartsString || isFinalCharacter)
                result.append(convertedSpaceString);
            else
                result.append(' ');
            break;
        }
        case 2: {
            // Two leftover spaces become two converted spaces only when they
            // are the last two characters of a string that does not also start
            // with this run; otherwise a converted space followed by a plain one.
            const bool isFinalPair = !runStartsString && position + 2 == length;
            if (isFinalPair)
                result.append(convertedSpaceString, convertedSpaceString);
            else
                result.append(convertedSpaceString, ' ');
            break;
        }
        default:
            // The run length is a multiple of three: no leading group.
            break;
        }

        // Each remaining group of three is a plain space between two converted spaces.
        for (unsigned groups = runLength / 3; groups; --groups)
            result.append(convertedSpaceString, ' ', convertedSpaceString);

        position = runEnd;
    }

    return result.toString();
}
} // namespace WebCore