Home | History | Annotate | Download | only in src
      1 /*
      2  * Copyright (C) 2009 Google Inc. All rights reserved.
      3  *
      4  * Redistribution and use in source and binary forms, with or without
      5  * modification, are permitted provided that the following conditions are
      6  * met:
      7  *
      8  *     * Redistributions of source code must retain the above copyright
      9  * notice, this list of conditions and the following disclaimer.
     10  *     * Redistributions in binary form must reproduce the above
     11  * copyright notice, this list of conditions and the following disclaimer
     12  * in the documentation and/or other materials provided with the
     13  * distribution.
     14  *     * Neither the name of Google Inc. nor the names of its
     15  * contributors may be used to endorse or promote products derived from
     16  * this software without specific prior written permission.
     17  *
     18  * THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
     19  * "AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
     20  * LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
     21  * A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT
     22  * OWNER OR CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL,
     23  * SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT
     24  * LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE,
     25  * DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY
     26  * THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
     27  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
     28  * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
     29  */
     30 
     31 #include "config.h"
     32 #include "WebEntities.h"
     33 
     34 #include <string.h>
     35 
     36 #include "PlatformString.h"
     37 #include "StringBuilder.h"
     38 #include <wtf/HashMap.h>
     39 
     40 #include "WebString.h"
     41 
     42 using namespace WebCore;
     43 
     44 namespace {
     45 // Note that this file is also included by HTMLTokenizer.cpp so we are getting
     46 // two copies of the data in memory.  We can fix this by changing the script
     47 // that generated the array to create a static const that is its length, but
     48 // this is low priority since the data is less than 4K. We use anonymous
     49 // namespace to prevent name collisions.
     50 #include "HTMLEntityNames.c" // NOLINT
     51 }
     52 
     53 namespace WebKit {
     54 
     55 void populateMap(WTF::HashMap<int, WebCore::String>& map,
     56                  const Entity* entities,
     57                  size_t entitiesCount,
     58                  bool standardHTML)
     59 {
     60     ASSERT(map.isEmpty());
     61     const Entity* entity = &entities[0];
     62     for (size_t i = 0; i < entitiesCount; i++, entity++) {
     63         int code = entity->code;
     64         String name = entity->name;
     65         // For consistency, use the lowe case for entities that have both.
     66         if (map.contains(code) && map.get(code) == name.lower())
     67             continue;
     68         // Don't register &percnt;, &nsup; and &supl;.
     69         if (standardHTML && (code == '%' || code == 0x2285 || code == 0x00b9))
     70             continue;
     71         map.set(code, name);
     72     }
     73     if (standardHTML)
     74         map.set(static_cast<int>(0x0027), String("#39"));
     75 }
     76 
     77 static const Entity xmlBuiltInEntityCodes[] = {
     78     { "lt", 0x003c },
     79     { "gt", 0x003e },
     80     { "amp", 0x0026 },
     81     { "apos", 0x0027 },
     82     { "quot", 0x0022 }
     83 };
     84 
     85 WebEntities::WebEntities(bool xmlEntities)
     86 {
     87     if (xmlEntities)
     88         populateMap(m_entitiesMap,
     89                     xmlBuiltInEntityCodes,
     90                     sizeof(xmlBuiltInEntityCodes) / sizeof(Entity),
     91                     false);
     92     else
     93         populateMap(m_entitiesMap,
     94                     wordlist,
     95                     sizeof(wordlist) / sizeof(Entity),
     96                     true);
     97 }
     98 
     99 String WebEntities::entityNameByCode(int code) const
    100 {
    101     if (m_entitiesMap.contains(code))
    102         return m_entitiesMap.get(code);
    103     return "";
    104 }
    105 
    106 String WebEntities::convertEntitiesInString(const String& value) const
    107 {
    108     unsigned len = value.length();
    109     const UChar* startPos = value.characters();
    110     const UChar* curPos = startPos;
    111 
    112     // FIXME: Optimize - create StringBuilder only if value has any entities.
    113     StringBuilder result;
    114     while (len--) {
    115         if (m_entitiesMap.contains(*curPos)) {
    116             // Append content before entity code.
    117             if (curPos > startPos)
    118                 result.append(String(startPos, curPos - startPos));
    119             result.append("&");
    120             result.append(m_entitiesMap.get(*curPos));
    121             result.append(";");
    122             startPos = ++curPos;
    123         } else
    124             curPos++;
    125     }
    126     // Append the remaining content.
    127     if (curPos > startPos)
    128         result.append(String(startPos, curPos - startPos));
    129 
    130     return result.toString();
    131 }
    132 
    133 } // namespace WebKit
    134