1 /* 2 * Copyright (C) 2004, 2008 Apple Inc. All rights reserved. 3 * 4 * Redistribution and use in source and binary forms, with or without 5 * modification, are permitted provided that the following conditions 6 * are met: 7 * 1. Redistributions of source code must retain the above copyright 8 * notice, this list of conditions and the following disclaimer. 9 * 2. Redistributions in binary form must reproduce the above copyright 10 * notice, this list of conditions and the following disclaimer in the 11 * documentation and/or other materials provided with the distribution. 12 * 13 * THIS SOFTWARE IS PROVIDED BY APPLE COMPUTER, INC. ``AS IS'' AND ANY 14 * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE 15 * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR 16 * PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL APPLE COMPUTER, INC. OR 17 * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, 18 * EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, 19 * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR 20 * PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY 21 * OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 22 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 23 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 24 */ 25 26 #include "config.h" 27 #include "core/editing/HTMLInterchange.h" 28 29 #include "core/dom/Text.h" 30 #include "core/editing/TextIterator.h" 31 #include "core/rendering/RenderObject.h" 32 #include "wtf/text/StringBuilder.h" 33 #include "wtf/unicode/CharacterNames.h" 34 35 namespace WebCore { 36 37 String convertHTMLTextToInterchangeFormat(const String& in, const Text* node) 38 { 39 // Assume all the text comes from node. 40 if (node->renderer() && node->renderer()->style()->preserveNewline()) 41 return in; 42 43 const char convertedSpaceString[] = "<span class=\"" AppleConvertedSpace "\">\xA0</span>"; 44 COMPILE_ASSERT((static_cast<unsigned char>('\xA0') == noBreakSpace), ConvertedSpaceStringSpaceIsNoBreakSpace); 45 46 StringBuilder s; 47 48 unsigned i = 0; 49 unsigned consumed = 0; 50 while (i < in.length()) { 51 consumed = 1; 52 if (isCollapsibleWhitespace(in[i])) { 53 // count number of adjoining spaces 54 unsigned j = i + 1; 55 while (j < in.length() && isCollapsibleWhitespace(in[j])) 56 j++; 57 unsigned count = j - i; 58 consumed = count; 59 while (count) { 60 unsigned add = count % 3; 61 switch (add) { 62 case 0: 63 s.appendLiteral(convertedSpaceString); 64 s.append(' '); 65 s.appendLiteral(convertedSpaceString); 66 add = 3; 67 break; 68 case 1: 69 if (i == 0 || i + 1 == in.length()) // at start or end of string 70 s.appendLiteral(convertedSpaceString); 71 else 72 s.append(' '); 73 break; 74 case 2: 75 if (i == 0) { 76 // at start of string 77 s.appendLiteral(convertedSpaceString); 78 s.append(' '); 79 } else if (i + 2 == in.length()) { 80 // at end of string 81 s.appendLiteral(convertedSpaceString); 82 s.appendLiteral(convertedSpaceString); 83 } else { 84 s.appendLiteral(convertedSpaceString); 85 s.append(' '); 86 } 87 break; 88 } 89 count -= add; 90 } 91 } else 92 s.append(in[i]); 93 i += consumed; 94 } 95 96 return s.toString(); 97 } 98 99 } // namespace WebCore 100