1 /* 2 * Copyright (C) 2009 Google Inc. All rights reserved. 3 * 4 * Redistribution and use in source and binary forms, with or without 5 * modification, are permitted provided that the following conditions are 6 * met: 7 * 8 * * Redistributions of source code must retain the above copyright 9 * notice, this list of conditions and the following disclaimer. 10 * * Redistributions in binary form must reproduce the above 11 * copyright notice, this list of conditions and the following disclaimer 12 * in the documentation and/or other materials provided with the 13 * distribution. 14 * * Neither the name of Google Inc. nor the names of its 15 * contributors may be used to endorse or promote products derived from 16 * this software without specific prior written permission. 17 * 18 * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS 19 * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT 20 * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR 21 * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT 22 * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, 23 * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT 24 * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, 25 * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY 26 * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT 27 * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE 28 * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE. 29 */ 30 31 #include "config.h" 32 #include "WebEntities.h" 33 34 #include <string.h> 35 36 #include "PlatformString.h" 37 #include "StringBuilder.h" 38 #include <wtf/HashMap.h> 39 40 #include "WebString.h" 41 42 using namespace WebCore; 43 44 namespace { 45 // Note that this file is also included by HTMLTokenizer.cpp so we are getting 46 // two copies of the data in memory. We can fix this by changing the script 47 // that generated the array to create a static const that is its length, but 48 // this is low priority since the data is less than 4K. We use anonymous 49 // namespace to prevent name collisions. 50 #include "HTMLEntityNames.c" // NOLINT 51 } 52 53 namespace WebKit { 54 55 void populateMap(WTF::HashMap<int, WebCore::String>& map, 56 const Entity* entities, 57 size_t entitiesCount, 58 bool standardHTML) 59 { 60 ASSERT(map.isEmpty()); 61 const Entity* entity = &entities[0]; 62 for (size_t i = 0; i < entitiesCount; i++, entity++) { 63 int code = entity->code; 64 String name = entity->name; 65 // For consistency, use the lowe case for entities that have both. 66 if (map.contains(code) && map.get(code) == name.lower()) 67 continue; 68 // Don't register %, ⊅ and &supl;. 69 if (standardHTML && (code == '%' || code == 0x2285 || code == 0x00b9)) 70 continue; 71 map.set(code, name); 72 } 73 if (standardHTML) 74 map.set(static_cast<int>(0x0027), String("#39")); 75 } 76 77 static const Entity xmlBuiltInEntityCodes[] = { 78 { "lt", 0x003c }, 79 { "gt", 0x003e }, 80 { "amp", 0x0026 }, 81 { "apos", 0x0027 }, 82 { "quot", 0x0022 } 83 }; 84 85 WebEntities::WebEntities(bool xmlEntities) 86 { 87 if (xmlEntities) 88 populateMap(m_entitiesMap, 89 xmlBuiltInEntityCodes, 90 sizeof(xmlBuiltInEntityCodes) / sizeof(Entity), 91 false); 92 else 93 populateMap(m_entitiesMap, 94 wordlist, 95 sizeof(wordlist) / sizeof(Entity), 96 true); 97 } 98 99 String WebEntities::entityNameByCode(int code) const 100 { 101 if (m_entitiesMap.contains(code)) 102 return m_entitiesMap.get(code); 103 return ""; 104 } 105 106 String WebEntities::convertEntitiesInString(const String& value) const 107 { 108 unsigned len = value.length(); 109 const UChar* startPos = value.characters(); 110 const UChar* curPos = startPos; 111 112 // FIXME: Optimize - create StringBuilder only if value has any entities. 113 StringBuilder result; 114 while (len--) { 115 if (m_entitiesMap.contains(*curPos)) { 116 // Append content before entity code. 117 if (curPos > startPos) 118 result.append(String(startPos, curPos - startPos)); 119 result.append("&"); 120 result.append(m_entitiesMap.get(*curPos)); 121 result.append(";"); 122 startPos = ++curPos; 123 } else 124 curPos++; 125 } 126 // Append the remaining content. 127 if (curPos > startPos) 128 result.append(String(startPos, curPos - startPos)); 129 130 return result.toString(); 131 } 132 133 } // namespace WebKit 134