1/*
2 * Copyright (C) 2004, 2008 Apple Inc. All rights reserved.
3 *
4 * Redistribution and use in source and binary forms, with or without
5 * modification, are permitted provided that the following conditions
6 * are met:
7 * 1. Redistributions of source code must retain the above copyright
8 * notice, this list of conditions and the following disclaimer.
9 * 2. Redistributions in binary form must reproduce the above copyright
10 * notice, this list of conditions and the following disclaimer in the
11 * documentation and/or other materials provided with the distribution.
12 *
13 * THIS SOFTWARE IS PROVIDED BY APPLE INC. ``AS IS'' AND ANY
14 * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
15 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
16 * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL APPLE INC. OR
17 * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
18 * EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
19 * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
20 * PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
21 * OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
22 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
23 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
24 */
25
26#include "config.h"
27#include "HTMLInterchange.h"
28
29#include "Editing.h"
30#include "RenderElement.h"
31#include "RenderText.h"
32#include "Text.h"
33#include "TextIterator.h"
34#include <wtf/text/StringBuilder.h>
35#include <wtf/unicode/CharacterNames.h>
36
37namespace WebCore {
38
39String convertHTMLTextToInterchangeFormat(const String& in, const Text* node)
40{
41 // Assume all the text comes from node.
42 if (node->renderer() && node->renderer()->style().preserveNewline())
43 return in;
44
45 const char convertedSpaceString[] = "<span class=\"" AppleConvertedSpace "\">\xA0</span>";
46 COMPILE_ASSERT((static_cast<unsigned char>('\xA0') == noBreakSpace), ConvertedSpaceStringSpaceIsNoBreakSpace);
47
48 StringBuilder s;
49
50 unsigned i = 0;
51 unsigned consumed = 0;
52 while (i < in.length()) {
53 consumed = 1;
54 if (deprecatedIsCollapsibleWhitespace(in[i])) {
55 // count number of adjoining spaces
56 unsigned j = i + 1;
57 while (j < in.length() && deprecatedIsCollapsibleWhitespace(in[j]))
58 j++;
59 unsigned count = j - i;
60 consumed = count;
61 while (count) {
62 unsigned add = count % 3;
63 switch (add) {
64 case 0:
65 s.appendLiteral(convertedSpaceString);
66 s.append(' ');
67 s.appendLiteral(convertedSpaceString);
68 add = 3;
69 break;
70 case 1:
71 if (i == 0 || i + 1 == in.length()) // at start or end of string
72 s.appendLiteral(convertedSpaceString);
73 else
74 s.append(' ');
75 break;
76 case 2:
77 if (i == 0) {
78 // at start of string
79 s.appendLiteral(convertedSpaceString);
80 s.append(' ');
81 } else if (i + 2 == in.length()) {
82 // at end of string
83 s.appendLiteral(convertedSpaceString);
84 s.appendLiteral(convertedSpaceString);
85 } else {
86 s.appendLiteral(convertedSpaceString);
87 s.append(' ');
88 }
89 break;
90 }
91 count -= add;
92 }
93 } else
94 s.append(in[i]);
95 i += consumed;
96 }
97
98 return s.toString();
99}
100
101} // namespace WebCore
102