Home | History | Annotate | Download | only in parser
      1 /*
      2  * Copyright (C) 2008 Apple Inc. All Rights Reserved.
      3  * Copyright (C) 2010 Google, Inc. All Rights Reserved.
      4  *
      5  * Redistribution and use in source and binary forms, with or without
      6  * modification, are permitted provided that the following conditions
      7  * are met:
      8  * 1. Redistributions of source code must retain the above copyright
      9  *    notice, this list of conditions and the following disclaimer.
     10  * 2. Redistributions in binary form must reproduce the above copyright
     11  *    notice, this list of conditions and the following disclaimer in the
     12  *    documentation and/or other materials provided with the distribution.
     13  *
     14  * THIS SOFTWARE IS PROVIDED BY APPLE INC. ``AS IS'' AND ANY
     15  * EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE
     16  * IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR
     17  * PURPOSE ARE DISCLAIMED.  IN NO EVENT SHALL APPLE INC. OR
     18  * CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
     19  * EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
     20  * PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
     21  * PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY
     22  * OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT
     23  * (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE
     24  * OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.
     25  */
     26 
     27 #ifndef HTMLEntityParser_h
     28 #define HTMLEntityParser_h
     29 
     30 #include "platform/text/SegmentedString.h"
     31 
     32 namespace blink {
     33 
     34 class DecodedHTMLEntity {
     35 private:
     36     // HTML entities contain at most four UTF-16 code units.
     37     static const unsigned kMaxLength = 4;
     38 
     39 public:
     40     DecodedHTMLEntity() : length(0) { }
     41 
     42     bool isEmpty() const { return !length; }
     43 
     44     void append(UChar c)
     45     {
     46         RELEASE_ASSERT(length < kMaxLength);
     47         data[length++] = c;
     48     }
     49 
     50     void append(UChar32 c)
     51     {
     52         if (U_IS_BMP(c)) {
     53             append(static_cast<UChar>(c));
     54             return;
     55         }
     56         append(U16_LEAD(c));
     57         append(U16_TRAIL(c));
     58     }
     59 
     60     unsigned length;
     61     UChar data[kMaxLength];
     62 };
     63 
     64 bool consumeHTMLEntity(SegmentedString&, DecodedHTMLEntity& decodedEntity, bool& notEnoughCharacters, UChar additionalAllowedCharacter = '\0');
     65 
     66 // Used by the XML parser.  Not suitable for use in HTML parsing.  Use consumeHTMLEntity instead.
     67 size_t decodeNamedEntityToUCharArray(const char*, UChar result[4]);
     68 
     69 }
     70 
     71 #endif
     72