2 * Copyright (C) 2004, 2008 Apple Inc. All rights reserved.
4 * Redistribution and use in source and binary forms, with or without
5 * modification, are permitted provided that the following conditions
7 * 1. Redistributions of source code must retain the above copyright
8 * notice, this list of conditions and the following disclaimer.
9 * 2. Redistributions in binary form must reproduce the above copyright
10 * notice, this list of conditions and the following disclaimer in the
11 * documentation and/or other materials provided with the distribution.
13 * THIS SOFTWARE IS PROVIDED BY APPLE COMPUTER, INC. ``AS IS'' AND ANY
14 * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
15 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
16 * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL APPLE COMPUTER, INC. OR
17 * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
18 * EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
19 * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
20 * PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
21 * OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
22 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
23 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
27 #include "core/editing/HTMLInterchange.h"
29 #include "core/dom/Text.h"
30 #include "core/editing/htmlediting.h"
31 #include "core/rendering/RenderObject.h"
32 #include "core/rendering/RenderText.h"
33 #include "wtf/text/StringBuilder.h"
34 #include "wtf/unicode/CharacterNames.h"
38 String convertHTMLTextToInterchangeFormat(const String& in, const Text& node)
40 // Assume all the text comes from node.
41 if (node.renderer() && node.renderer()->style()->preserveNewline())
44 const char convertedSpaceString[] = "<span class=\"" AppleConvertedSpace "\">\xA0</span>";
45 COMPILE_ASSERT((static_cast<unsigned char>('\xA0') == noBreakSpace), ConvertedSpaceStringSpaceIsNoBreakSpace);
50 unsigned consumed = 0;
51 while (i < in.length()) {
53 if (isCollapsibleWhitespace(in[i])) {
54 // count number of adjoining spaces
56 while (j < in.length() && isCollapsibleWhitespace(in[j]))
58 unsigned count = j - i;
61 unsigned add = count % 3;
64 s.appendLiteral(convertedSpaceString);
66 s.appendLiteral(convertedSpaceString);
70 if (i == 0 || i + 1 == in.length()) // at start or end of string
71 s.appendLiteral(convertedSpaceString);
78 s.appendLiteral(convertedSpaceString);
80 } else if (i + 2 == in.length()) {
82 s.appendLiteral(convertedSpaceString);
83 s.appendLiteral(convertedSpaceString);
85 s.appendLiteral(convertedSpaceString);