Home | History | Annotate | Download | only in libxml2
      1 /*
      2  * entities.c : implementation for the XML entities handling
      3  *
      4  * See Copyright for the status of this software.
      5  *
      6  * daniel (at) veillard.com
      7  */
      8 
      9 /* To avoid EBCDIC trouble when parsing on zOS */
     10 #if defined(__MVS__)
     11 #pragma convert("ISO8859-1")
     12 #endif
     13 
     14 #define IN_LIBXML
     15 #include "libxml.h"
     16 
     17 #include <string.h>
     18 #ifdef HAVE_STDLIB_H
     19 #include <stdlib.h>
     20 #endif
     21 #include <libxml/xmlmemory.h>
     22 #include <libxml/hash.h>
     23 #include <libxml/entities.h>
     24 #include <libxml/parser.h>
     25 #include <libxml/parserInternals.h>
     26 #include <libxml/xmlerror.h>
     27 #include <libxml/globals.h>
     28 #include <libxml/dict.h>
     29 
     30 #include "save.h"
     31 
     32 /*
     33  * The XML predefined entities.
     34  */
     35 
     36 static xmlEntity xmlEntityLt = {
     37     NULL, XML_ENTITY_DECL, BAD_CAST "lt",
     38     NULL, NULL, NULL, NULL, NULL, NULL,
     39     BAD_CAST "<", BAD_CAST "<", 1,
     40     XML_INTERNAL_PREDEFINED_ENTITY,
     41     NULL, NULL, NULL, NULL, 0, 1
     42 };
     43 static xmlEntity xmlEntityGt = {
     44     NULL, XML_ENTITY_DECL, BAD_CAST "gt",
     45     NULL, NULL, NULL, NULL, NULL, NULL,
     46     BAD_CAST ">", BAD_CAST ">", 1,
     47     XML_INTERNAL_PREDEFINED_ENTITY,
     48     NULL, NULL, NULL, NULL, 0, 1
     49 };
     50 static xmlEntity xmlEntityAmp = {
     51     NULL, XML_ENTITY_DECL, BAD_CAST "amp",
     52     NULL, NULL, NULL, NULL, NULL, NULL,
     53     BAD_CAST "&", BAD_CAST "&", 1,
     54     XML_INTERNAL_PREDEFINED_ENTITY,
     55     NULL, NULL, NULL, NULL, 0, 1
     56 };
     57 static xmlEntity xmlEntityQuot = {
     58     NULL, XML_ENTITY_DECL, BAD_CAST "quot",
     59     NULL, NULL, NULL, NULL, NULL, NULL,
     60     BAD_CAST "\"", BAD_CAST "\"", 1,
     61     XML_INTERNAL_PREDEFINED_ENTITY,
     62     NULL, NULL, NULL, NULL, 0, 1
     63 };
     64 static xmlEntity xmlEntityApos = {
     65     NULL, XML_ENTITY_DECL, BAD_CAST "apos",
     66     NULL, NULL, NULL, NULL, NULL, NULL,
     67     BAD_CAST "'", BAD_CAST "'", 1,
     68     XML_INTERNAL_PREDEFINED_ENTITY,
     69     NULL, NULL, NULL, NULL, 0, 1
     70 };
     71 
     72 /**
     73  * xmlEntitiesErrMemory:
     74  * @extra:  extra informations
     75  *
     76  * Handle an out of memory condition
     77  */
     78 static void
     79 xmlEntitiesErrMemory(const char *extra)
     80 {
     81     __xmlSimpleError(XML_FROM_TREE, XML_ERR_NO_MEMORY, NULL, NULL, extra);
     82 }
     83 
     84 /**
     85  * xmlEntitiesErr:
     86  * @code:  the error code
     87  * @msg:  the message
     88  *
     89  * Handle an out of memory condition
     90  */
     91 static void LIBXML_ATTR_FORMAT(2,0)
     92 xmlEntitiesErr(xmlParserErrors code, const char *msg)
     93 {
     94     __xmlSimpleError(XML_FROM_TREE, code, NULL, msg, NULL);
     95 }
     96 
     97 /*
     98  * xmlFreeEntity : clean-up an entity record.
     99  */
    100 static void
    101 xmlFreeEntity(xmlEntityPtr entity)
    102 {
    103     xmlDictPtr dict = NULL;
    104 
    105     if (entity == NULL)
    106         return;
    107 
    108     if (entity->doc != NULL)
    109         dict = entity->doc->dict;
    110 
    111 
    112     if ((entity->children) && (entity->owner == 1) &&
    113         (entity == (xmlEntityPtr) entity->children->parent))
    114         xmlFreeNodeList(entity->children);
    115     if (dict != NULL) {
    116         if ((entity->name != NULL) && (!xmlDictOwns(dict, entity->name)))
    117             xmlFree((char *) entity->name);
    118         if ((entity->ExternalID != NULL) &&
    119 	    (!xmlDictOwns(dict, entity->ExternalID)))
    120             xmlFree((char *) entity->ExternalID);
    121         if ((entity->SystemID != NULL) &&
    122 	    (!xmlDictOwns(dict, entity->SystemID)))
    123             xmlFree((char *) entity->SystemID);
    124         if ((entity->URI != NULL) && (!xmlDictOwns(dict, entity->URI)))
    125             xmlFree((char *) entity->URI);
    126         if ((entity->content != NULL)
    127             && (!xmlDictOwns(dict, entity->content)))
    128             xmlFree((char *) entity->content);
    129         if ((entity->orig != NULL) && (!xmlDictOwns(dict, entity->orig)))
    130             xmlFree((char *) entity->orig);
    131     } else {
    132         if (entity->name != NULL)
    133             xmlFree((char *) entity->name);
    134         if (entity->ExternalID != NULL)
    135             xmlFree((char *) entity->ExternalID);
    136         if (entity->SystemID != NULL)
    137             xmlFree((char *) entity->SystemID);
    138         if (entity->URI != NULL)
    139             xmlFree((char *) entity->URI);
    140         if (entity->content != NULL)
    141             xmlFree((char *) entity->content);
    142         if (entity->orig != NULL)
    143             xmlFree((char *) entity->orig);
    144     }
    145     xmlFree(entity);
    146 }
    147 
    148 /*
    149  * xmlCreateEntity:
    150  *
    151  * internal routine doing the entity node strutures allocations
    152  */
    153 static xmlEntityPtr
    154 xmlCreateEntity(xmlDictPtr dict, const xmlChar *name, int type,
    155 	        const xmlChar *ExternalID, const xmlChar *SystemID,
    156 	        const xmlChar *content) {
    157     xmlEntityPtr ret;
    158 
    159     ret = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
    160     if (ret == NULL) {
    161         xmlEntitiesErrMemory("xmlCreateEntity: malloc failed");
    162 	return(NULL);
    163     }
    164     memset(ret, 0, sizeof(xmlEntity));
    165     ret->type = XML_ENTITY_DECL;
    166     ret->checked = 0;
    167 
    168     /*
    169      * fill the structure.
    170      */
    171     ret->etype = (xmlEntityType) type;
    172     if (dict == NULL) {
    173 	ret->name = xmlStrdup(name);
    174 	if (ExternalID != NULL)
    175 	    ret->ExternalID = xmlStrdup(ExternalID);
    176 	if (SystemID != NULL)
    177 	    ret->SystemID = xmlStrdup(SystemID);
    178     } else {
    179         ret->name = xmlDictLookup(dict, name, -1);
    180 	if (ExternalID != NULL)
    181 	    ret->ExternalID = xmlDictLookup(dict, ExternalID, -1);
    182 	if (SystemID != NULL)
    183 	    ret->SystemID = xmlDictLookup(dict, SystemID, -1);
    184     }
    185     if (content != NULL) {
    186         ret->length = xmlStrlen(content);
    187 	if ((dict != NULL) && (ret->length < 5))
    188 	    ret->content = (xmlChar *)
    189 	                   xmlDictLookup(dict, content, ret->length);
    190 	else
    191 	    ret->content = xmlStrndup(content, ret->length);
    192      } else {
    193         ret->length = 0;
    194         ret->content = NULL;
    195     }
    196     ret->URI = NULL; /* to be computed by the layer knowing
    197 			the defining entity */
    198     ret->orig = NULL;
    199     ret->owner = 0;
    200 
    201     return(ret);
    202 }
    203 
    204 /*
    205  * xmlAddEntity : register a new entity for an entities table.
    206  */
    207 static xmlEntityPtr
    208 xmlAddEntity(xmlDtdPtr dtd, const xmlChar *name, int type,
    209 	  const xmlChar *ExternalID, const xmlChar *SystemID,
    210 	  const xmlChar *content) {
    211     xmlDictPtr dict = NULL;
    212     xmlEntitiesTablePtr table = NULL;
    213     xmlEntityPtr ret;
    214 
    215     if (name == NULL)
    216 	return(NULL);
    217     if (dtd == NULL)
    218 	return(NULL);
    219     if (dtd->doc != NULL)
    220         dict = dtd->doc->dict;
    221 
    222     switch (type) {
    223         case XML_INTERNAL_GENERAL_ENTITY:
    224         case XML_EXTERNAL_GENERAL_PARSED_ENTITY:
    225         case XML_EXTERNAL_GENERAL_UNPARSED_ENTITY:
    226 	    if (dtd->entities == NULL)
    227 		dtd->entities = xmlHashCreateDict(0, dict);
    228 	    table = dtd->entities;
    229 	    break;
    230         case XML_INTERNAL_PARAMETER_ENTITY:
    231         case XML_EXTERNAL_PARAMETER_ENTITY:
    232 	    if (dtd->pentities == NULL)
    233 		dtd->pentities = xmlHashCreateDict(0, dict);
    234 	    table = dtd->pentities;
    235 	    break;
    236         case XML_INTERNAL_PREDEFINED_ENTITY:
    237 	    return(NULL);
    238     }
    239     if (table == NULL)
    240 	return(NULL);
    241     ret = xmlCreateEntity(dict, name, type, ExternalID, SystemID, content);
    242     if (ret == NULL)
    243         return(NULL);
    244     ret->doc = dtd->doc;
    245 
    246     if (xmlHashAddEntry(table, name, ret)) {
    247 	/*
    248 	 * entity was already defined at another level.
    249 	 */
    250         xmlFreeEntity(ret);
    251 	return(NULL);
    252     }
    253     return(ret);
    254 }
    255 
    256 /**
    257  * xmlGetPredefinedEntity:
    258  * @name:  the entity name
    259  *
    260  * Check whether this name is an predefined entity.
    261  *
    262  * Returns NULL if not, otherwise the entity
    263  */
    264 xmlEntityPtr
    265 xmlGetPredefinedEntity(const xmlChar *name) {
    266     if (name == NULL) return(NULL);
    267     switch (name[0]) {
    268         case 'l':
    269 	    if (xmlStrEqual(name, BAD_CAST "lt"))
    270 	        return(&xmlEntityLt);
    271 	    break;
    272         case 'g':
    273 	    if (xmlStrEqual(name, BAD_CAST "gt"))
    274 	        return(&xmlEntityGt);
    275 	    break;
    276         case 'a':
    277 	    if (xmlStrEqual(name, BAD_CAST "amp"))
    278 	        return(&xmlEntityAmp);
    279 	    if (xmlStrEqual(name, BAD_CAST "apos"))
    280 	        return(&xmlEntityApos);
    281 	    break;
    282         case 'q':
    283 	    if (xmlStrEqual(name, BAD_CAST "quot"))
    284 	        return(&xmlEntityQuot);
    285 	    break;
    286 	default:
    287 	    break;
    288     }
    289     return(NULL);
    290 }
    291 
    292 /**
    293  * xmlAddDtdEntity:
    294  * @doc:  the document
    295  * @name:  the entity name
    296  * @type:  the entity type XML_xxx_yyy_ENTITY
    297  * @ExternalID:  the entity external ID if available
    298  * @SystemID:  the entity system ID if available
    299  * @content:  the entity content
    300  *
    301  * Register a new entity for this document DTD external subset.
    302  *
    303  * Returns a pointer to the entity or NULL in case of error
    304  */
    305 xmlEntityPtr
    306 xmlAddDtdEntity(xmlDocPtr doc, const xmlChar *name, int type,
    307 	        const xmlChar *ExternalID, const xmlChar *SystemID,
    308 		const xmlChar *content) {
    309     xmlEntityPtr ret;
    310     xmlDtdPtr dtd;
    311 
    312     if (doc == NULL) {
    313 	xmlEntitiesErr(XML_DTD_NO_DOC,
    314 	        "xmlAddDtdEntity: document is NULL");
    315 	return(NULL);
    316     }
    317     if (doc->extSubset == NULL) {
    318 	xmlEntitiesErr(XML_DTD_NO_DTD,
    319 	        "xmlAddDtdEntity: document without external subset");
    320 	return(NULL);
    321     }
    322     dtd = doc->extSubset;
    323     ret = xmlAddEntity(dtd, name, type, ExternalID, SystemID, content);
    324     if (ret == NULL) return(NULL);
    325 
    326     /*
    327      * Link it to the DTD
    328      */
    329     ret->parent = dtd;
    330     ret->doc = dtd->doc;
    331     if (dtd->last == NULL) {
    332 	dtd->children = dtd->last = (xmlNodePtr) ret;
    333     } else {
    334         dtd->last->next = (xmlNodePtr) ret;
    335 	ret->prev = dtd->last;
    336 	dtd->last = (xmlNodePtr) ret;
    337     }
    338     return(ret);
    339 }
    340 
    341 /**
    342  * xmlAddDocEntity:
    343  * @doc:  the document
    344  * @name:  the entity name
    345  * @type:  the entity type XML_xxx_yyy_ENTITY
    346  * @ExternalID:  the entity external ID if available
    347  * @SystemID:  the entity system ID if available
    348  * @content:  the entity content
    349  *
    350  * Register a new entity for this document.
    351  *
    352  * Returns a pointer to the entity or NULL in case of error
    353  */
    354 xmlEntityPtr
    355 xmlAddDocEntity(xmlDocPtr doc, const xmlChar *name, int type,
    356 	        const xmlChar *ExternalID, const xmlChar *SystemID,
    357 	        const xmlChar *content) {
    358     xmlEntityPtr ret;
    359     xmlDtdPtr dtd;
    360 
    361     if (doc == NULL) {
    362 	xmlEntitiesErr(XML_DTD_NO_DOC,
    363 	        "xmlAddDocEntity: document is NULL");
    364 	return(NULL);
    365     }
    366     if (doc->intSubset == NULL) {
    367 	xmlEntitiesErr(XML_DTD_NO_DTD,
    368 	        "xmlAddDocEntity: document without internal subset");
    369 	return(NULL);
    370     }
    371     dtd = doc->intSubset;
    372     ret = xmlAddEntity(dtd, name, type, ExternalID, SystemID, content);
    373     if (ret == NULL) return(NULL);
    374 
    375     /*
    376      * Link it to the DTD
    377      */
    378     ret->parent = dtd;
    379     ret->doc = dtd->doc;
    380     if (dtd->last == NULL) {
    381 	dtd->children = dtd->last = (xmlNodePtr) ret;
    382     } else {
    383 	dtd->last->next = (xmlNodePtr) ret;
    384 	ret->prev = dtd->last;
    385 	dtd->last = (xmlNodePtr) ret;
    386     }
    387     return(ret);
    388 }
    389 
    390 /**
    391  * xmlNewEntity:
    392  * @doc:  the document
    393  * @name:  the entity name
    394  * @type:  the entity type XML_xxx_yyy_ENTITY
    395  * @ExternalID:  the entity external ID if available
    396  * @SystemID:  the entity system ID if available
    397  * @content:  the entity content
    398  *
    399  * Create a new entity, this differs from xmlAddDocEntity() that if
    400  * the document is NULL or has no internal subset defined, then an
    401  * unlinked entity structure will be returned, it is then the responsability
    402  * of the caller to link it to the document later or free it when not needed
    403  * anymore.
    404  *
    405  * Returns a pointer to the entity or NULL in case of error
    406  */
    407 xmlEntityPtr
    408 xmlNewEntity(xmlDocPtr doc, const xmlChar *name, int type,
    409 	     const xmlChar *ExternalID, const xmlChar *SystemID,
    410 	     const xmlChar *content) {
    411     xmlEntityPtr ret;
    412     xmlDictPtr dict;
    413 
    414     if ((doc != NULL) && (doc->intSubset != NULL)) {
    415 	return(xmlAddDocEntity(doc, name, type, ExternalID, SystemID, content));
    416     }
    417     if (doc != NULL)
    418         dict = doc->dict;
    419     else
    420         dict = NULL;
    421     ret = xmlCreateEntity(dict, name, type, ExternalID, SystemID, content);
    422     if (ret == NULL)
    423         return(NULL);
    424     ret->doc = doc;
    425     return(ret);
    426 }
    427 
    428 /**
    429  * xmlGetEntityFromTable:
    430  * @table:  an entity table
    431  * @name:  the entity name
    432  * @parameter:  look for parameter entities
    433  *
    434  * Do an entity lookup in the table.
    435  * returns the corresponding parameter entity, if found.
    436  *
    437  * Returns A pointer to the entity structure or NULL if not found.
    438  */
    439 static xmlEntityPtr
    440 xmlGetEntityFromTable(xmlEntitiesTablePtr table, const xmlChar *name) {
    441     return((xmlEntityPtr) xmlHashLookup(table, name));
    442 }
    443 
    444 /**
    445  * xmlGetParameterEntity:
    446  * @doc:  the document referencing the entity
    447  * @name:  the entity name
    448  *
    449  * Do an entity lookup in the internal and external subsets and
    450  * returns the corresponding parameter entity, if found.
    451  *
    452  * Returns A pointer to the entity structure or NULL if not found.
    453  */
    454 xmlEntityPtr
    455 xmlGetParameterEntity(xmlDocPtr doc, const xmlChar *name) {
    456     xmlEntitiesTablePtr table;
    457     xmlEntityPtr ret;
    458 
    459     if (doc == NULL)
    460 	return(NULL);
    461     if ((doc->intSubset != NULL) && (doc->intSubset->pentities != NULL)) {
    462 	table = (xmlEntitiesTablePtr) doc->intSubset->pentities;
    463 	ret = xmlGetEntityFromTable(table, name);
    464 	if (ret != NULL)
    465 	    return(ret);
    466     }
    467     if ((doc->extSubset != NULL) && (doc->extSubset->pentities != NULL)) {
    468 	table = (xmlEntitiesTablePtr) doc->extSubset->pentities;
    469 	return(xmlGetEntityFromTable(table, name));
    470     }
    471     return(NULL);
    472 }
    473 
    474 /**
    475  * xmlGetDtdEntity:
    476  * @doc:  the document referencing the entity
    477  * @name:  the entity name
    478  *
    479  * Do an entity lookup in the DTD entity hash table and
    480  * returns the corresponding entity, if found.
    481  * Note: the first argument is the document node, not the DTD node.
    482  *
    483  * Returns A pointer to the entity structure or NULL if not found.
    484  */
    485 xmlEntityPtr
    486 xmlGetDtdEntity(xmlDocPtr doc, const xmlChar *name) {
    487     xmlEntitiesTablePtr table;
    488 
    489     if (doc == NULL)
    490 	return(NULL);
    491     if ((doc->extSubset != NULL) && (doc->extSubset->entities != NULL)) {
    492 	table = (xmlEntitiesTablePtr) doc->extSubset->entities;
    493 	return(xmlGetEntityFromTable(table, name));
    494     }
    495     return(NULL);
    496 }
    497 
    498 /**
    499  * xmlGetDocEntity:
    500  * @doc:  the document referencing the entity
    501  * @name:  the entity name
    502  *
    503  * Do an entity lookup in the document entity hash table and
    504  * returns the corresponding entity, otherwise a lookup is done
    505  * in the predefined entities too.
    506  *
    507  * Returns A pointer to the entity structure or NULL if not found.
    508  */
    509 xmlEntityPtr
    510 xmlGetDocEntity(const xmlDoc *doc, const xmlChar *name) {
    511     xmlEntityPtr cur;
    512     xmlEntitiesTablePtr table;
    513 
    514     if (doc != NULL) {
    515 	if ((doc->intSubset != NULL) && (doc->intSubset->entities != NULL)) {
    516 	    table = (xmlEntitiesTablePtr) doc->intSubset->entities;
    517 	    cur = xmlGetEntityFromTable(table, name);
    518 	    if (cur != NULL)
    519 		return(cur);
    520 	}
    521 	if (doc->standalone != 1) {
    522 	    if ((doc->extSubset != NULL) &&
    523 		(doc->extSubset->entities != NULL)) {
    524 		table = (xmlEntitiesTablePtr) doc->extSubset->entities;
    525 		cur = xmlGetEntityFromTable(table, name);
    526 		if (cur != NULL)
    527 		    return(cur);
    528 	    }
    529 	}
    530     }
    531     return(xmlGetPredefinedEntity(name));
    532 }
    533 
    534 /*
    535  * Macro used to grow the current buffer.
    536  */
    537 #define growBufferReentrant() {						\
    538     xmlChar *tmp;                                                       \
    539     size_t new_size = buffer_size * 2;                                  \
    540     if (new_size < buffer_size) goto mem_error;                         \
    541     tmp = (xmlChar *) xmlRealloc(buffer, new_size);	                \
    542     if (tmp == NULL) goto mem_error;                                    \
    543     buffer = tmp;							\
    544     buffer_size = new_size;						\
    545 }
    546 
    547 /**
    548  * xmlEncodeEntitiesInternal:
    549  * @doc:  the document containing the string
    550  * @input:  A string to convert to XML.
    551  * @attr: are we handling an atrbute value
    552  *
    553  * Do a global encoding of a string, replacing the predefined entities
    554  * and non ASCII values with their entities and CharRef counterparts.
    555  * Contrary to xmlEncodeEntities, this routine is reentrant, and result
    556  * must be deallocated.
    557  *
    558  * Returns A newly allocated string with the substitution done.
    559  */
    560 static xmlChar *
    561 xmlEncodeEntitiesInternal(xmlDocPtr doc, const xmlChar *input, int attr) {
    562     const xmlChar *cur = input;
    563     xmlChar *buffer = NULL;
    564     xmlChar *out = NULL;
    565     size_t buffer_size = 0;
    566     int html = 0;
    567 
    568     if (input == NULL) return(NULL);
    569     if (doc != NULL)
    570         html = (doc->type == XML_HTML_DOCUMENT_NODE);
    571 
    572     /*
    573      * allocate an translation buffer.
    574      */
    575     buffer_size = 1000;
    576     buffer = (xmlChar *) xmlMalloc(buffer_size * sizeof(xmlChar));
    577     if (buffer == NULL) {
    578         xmlEntitiesErrMemory("xmlEncodeEntities: malloc failed");
    579 	return(NULL);
    580     }
    581     out = buffer;
    582 
    583     while (*cur != '\0') {
    584         size_t indx = out - buffer;
    585         if (indx + 100 > buffer_size) {
    586 
    587 	    growBufferReentrant();
    588 	    out = &buffer[indx];
    589 	}
    590 
    591 	/*
    592 	 * By default one have to encode at least '<', '>', '"' and '&' !
    593 	 */
    594 	if (*cur == '<') {
    595 	    const xmlChar *end;
    596 
    597 	    /*
    598 	     * Special handling of server side include in HTML attributes
    599 	     */
    600 	    if (html && attr &&
    601 	        (cur[1] == '!') && (cur[2] == '-') && (cur[3] == '-') &&
    602 	        ((end = xmlStrstr(cur, BAD_CAST "-->")) != NULL)) {
    603 	        while (cur != end) {
    604 		    *out++ = *cur++;
    605 		    indx = out - buffer;
    606 		    if (indx + 100 > buffer_size) {
    607 			growBufferReentrant();
    608 			out = &buffer[indx];
    609 		    }
    610 		}
    611 		*out++ = *cur++;
    612 		*out++ = *cur++;
    613 		*out++ = *cur++;
    614 		continue;
    615 	    }
    616 	    *out++ = '&';
    617 	    *out++ = 'l';
    618 	    *out++ = 't';
    619 	    *out++ = ';';
    620 	} else if (*cur == '>') {
    621 	    *out++ = '&';
    622 	    *out++ = 'g';
    623 	    *out++ = 't';
    624 	    *out++ = ';';
    625 	} else if (*cur == '&') {
    626 	    /*
    627 	     * Special handling of &{...} construct from HTML 4, see
    628 	     * http://www.w3.org/TR/html401/appendix/notes.html#h-B.7.1
    629 	     */
    630 	    if (html && attr && (cur[1] == '{') &&
    631 	        (strchr((const char *) cur, '}'))) {
    632 	        while (*cur != '}') {
    633 		    *out++ = *cur++;
    634 		    indx = out - buffer;
    635 		    if (indx + 100 > buffer_size) {
    636 			growBufferReentrant();
    637 			out = &buffer[indx];
    638 		    }
    639 		}
    640 		*out++ = *cur++;
    641 		continue;
    642 	    }
    643 	    *out++ = '&';
    644 	    *out++ = 'a';
    645 	    *out++ = 'm';
    646 	    *out++ = 'p';
    647 	    *out++ = ';';
    648 	} else if (((*cur >= 0x20) && (*cur < 0x80)) ||
    649 	    (*cur == '\n') || (*cur == '\t') || ((html) && (*cur == '\r'))) {
    650 	    /*
    651 	     * default case, just copy !
    652 	     */
    653 	    *out++ = *cur;
    654 	} else if (*cur >= 0x80) {
    655 	    if (((doc != NULL) && (doc->encoding != NULL)) || (html)) {
    656 		/*
    657 		 * Bjrn Reese <br (at) sseusa.com> provided the patch
    658 	        xmlChar xc;
    659 	        xc = (*cur & 0x3F) << 6;
    660 	        if (cur[1] != 0) {
    661 		    xc += *(++cur) & 0x3F;
    662 		    *out++ = xc;
    663 	        } else
    664 		 */
    665 		*out++ = *cur;
    666 	    } else {
    667 		/*
    668 		 * We assume we have UTF-8 input.
    669 		 */
    670 		char buf[11], *ptr;
    671 		int val = 0, l = 1;
    672 
    673 		if (*cur < 0xC0) {
    674 		    xmlEntitiesErr(XML_CHECK_NOT_UTF8,
    675 			    "xmlEncodeEntities: input not UTF-8");
    676 		    if (doc != NULL)
    677 			doc->encoding = xmlStrdup(BAD_CAST "ISO-8859-1");
    678 		    snprintf(buf, sizeof(buf), "&#%d;", *cur);
    679 		    buf[sizeof(buf) - 1] = 0;
    680 		    ptr = buf;
    681 		    while (*ptr != 0) *out++ = *ptr++;
    682 		    cur++;
    683 		    continue;
    684 		} else if (*cur < 0xE0) {
    685                     val = (cur[0]) & 0x1F;
    686 		    val <<= 6;
    687 		    val |= (cur[1]) & 0x3F;
    688 		    l = 2;
    689 		} else if (*cur < 0xF0) {
    690                     val = (cur[0]) & 0x0F;
    691 		    val <<= 6;
    692 		    val |= (cur[1]) & 0x3F;
    693 		    val <<= 6;
    694 		    val |= (cur[2]) & 0x3F;
    695 		    l = 3;
    696 		} else if (*cur < 0xF8) {
    697                     val = (cur[0]) & 0x07;
    698 		    val <<= 6;
    699 		    val |= (cur[1]) & 0x3F;
    700 		    val <<= 6;
    701 		    val |= (cur[2]) & 0x3F;
    702 		    val <<= 6;
    703 		    val |= (cur[3]) & 0x3F;
    704 		    l = 4;
    705 		}
    706 		if ((l == 1) || (!IS_CHAR(val))) {
    707 		    xmlEntitiesErr(XML_ERR_INVALID_CHAR,
    708 			"xmlEncodeEntities: char out of range\n");
    709 		    if (doc != NULL)
    710 			doc->encoding = xmlStrdup(BAD_CAST "ISO-8859-1");
    711 		    snprintf(buf, sizeof(buf), "&#%d;", *cur);
    712 		    buf[sizeof(buf) - 1] = 0;
    713 		    ptr = buf;
    714 		    while (*ptr != 0) *out++ = *ptr++;
    715 		    cur++;
    716 		    continue;
    717 		}
    718 		/*
    719 		 * We could do multiple things here. Just save as a char ref
    720 		 */
    721 		snprintf(buf, sizeof(buf), "&#x%X;", val);
    722 		buf[sizeof(buf) - 1] = 0;
    723 		ptr = buf;
    724 		while (*ptr != 0) *out++ = *ptr++;
    725 		cur += l;
    726 		continue;
    727 	    }
    728 	} else if (IS_BYTE_CHAR(*cur)) {
    729 	    char buf[11], *ptr;
    730 
    731 	    snprintf(buf, sizeof(buf), "&#%d;", *cur);
    732 	    buf[sizeof(buf) - 1] = 0;
    733             ptr = buf;
    734 	    while (*ptr != 0) *out++ = *ptr++;
    735 	}
    736 	cur++;
    737     }
    738     *out = 0;
    739     return(buffer);
    740 
    741 mem_error:
    742     xmlEntitiesErrMemory("xmlEncodeEntities: realloc failed");
    743     xmlFree(buffer);
    744     return(NULL);
    745 }
    746 
    747 /**
    748  * xmlEncodeAttributeEntities:
    749  * @doc:  the document containing the string
    750  * @input:  A string to convert to XML.
    751  *
    752  * Do a global encoding of a string, replacing the predefined entities
    753  * and non ASCII values with their entities and CharRef counterparts for
    754  * attribute values.
    755  *
    756  * Returns A newly allocated string with the substitution done.
    757  */
    758 xmlChar *
    759 xmlEncodeAttributeEntities(xmlDocPtr doc, const xmlChar *input) {
    760     return xmlEncodeEntitiesInternal(doc, input, 1);
    761 }
    762 
    763 /**
    764  * xmlEncodeEntitiesReentrant:
    765  * @doc:  the document containing the string
    766  * @input:  A string to convert to XML.
    767  *
    768  * Do a global encoding of a string, replacing the predefined entities
    769  * and non ASCII values with their entities and CharRef counterparts.
    770  * Contrary to xmlEncodeEntities, this routine is reentrant, and result
    771  * must be deallocated.
    772  *
    773  * Returns A newly allocated string with the substitution done.
    774  */
    775 xmlChar *
    776 xmlEncodeEntitiesReentrant(xmlDocPtr doc, const xmlChar *input) {
    777     return xmlEncodeEntitiesInternal(doc, input, 0);
    778 }
    779 
    780 /**
    781  * xmlEncodeSpecialChars:
    782  * @doc:  the document containing the string
    783  * @input:  A string to convert to XML.
    784  *
    785  * Do a global encoding of a string, replacing the predefined entities
    786  * this routine is reentrant, and result must be deallocated.
    787  *
    788  * Returns A newly allocated string with the substitution done.
    789  */
    790 xmlChar *
    791 xmlEncodeSpecialChars(const xmlDoc *doc ATTRIBUTE_UNUSED, const xmlChar *input) {
    792     const xmlChar *cur = input;
    793     xmlChar *buffer = NULL;
    794     xmlChar *out = NULL;
    795     size_t buffer_size = 0;
    796     if (input == NULL) return(NULL);
    797 
    798     /*
    799      * allocate an translation buffer.
    800      */
    801     buffer_size = 1000;
    802     buffer = (xmlChar *) xmlMalloc(buffer_size * sizeof(xmlChar));
    803     if (buffer == NULL) {
    804         xmlEntitiesErrMemory("xmlEncodeSpecialChars: malloc failed");
    805 	return(NULL);
    806     }
    807     out = buffer;
    808 
    809     while (*cur != '\0') {
    810         size_t indx = out - buffer;
    811         if (indx + 10 > buffer_size) {
    812 
    813 	    growBufferReentrant();
    814 	    out = &buffer[indx];
    815 	}
    816 
    817 	/*
    818 	 * By default one have to encode at least '<', '>', '"' and '&' !
    819 	 */
    820 	if (*cur == '<') {
    821 	    *out++ = '&';
    822 	    *out++ = 'l';
    823 	    *out++ = 't';
    824 	    *out++ = ';';
    825 	} else if (*cur == '>') {
    826 	    *out++ = '&';
    827 	    *out++ = 'g';
    828 	    *out++ = 't';
    829 	    *out++ = ';';
    830 	} else if (*cur == '&') {
    831 	    *out++ = '&';
    832 	    *out++ = 'a';
    833 	    *out++ = 'm';
    834 	    *out++ = 'p';
    835 	    *out++ = ';';
    836 	} else if (*cur == '"') {
    837 	    *out++ = '&';
    838 	    *out++ = 'q';
    839 	    *out++ = 'u';
    840 	    *out++ = 'o';
    841 	    *out++ = 't';
    842 	    *out++ = ';';
    843 	} else if (*cur == '\r') {
    844 	    *out++ = '&';
    845 	    *out++ = '#';
    846 	    *out++ = '1';
    847 	    *out++ = '3';
    848 	    *out++ = ';';
    849 	} else {
    850 	    /*
    851 	     * Works because on UTF-8, all extended sequences cannot
    852 	     * result in bytes in the ASCII range.
    853 	     */
    854 	    *out++ = *cur;
    855 	}
    856 	cur++;
    857     }
    858     *out = 0;
    859     return(buffer);
    860 
    861 mem_error:
    862     xmlEntitiesErrMemory("xmlEncodeSpecialChars: realloc failed");
    863     xmlFree(buffer);
    864     return(NULL);
    865 }
    866 
    867 /**
    868  * xmlCreateEntitiesTable:
    869  *
    870  * create and initialize an empty entities hash table.
    871  * This really doesn't make sense and should be deprecated
    872  *
    873  * Returns the xmlEntitiesTablePtr just created or NULL in case of error.
    874  */
    875 xmlEntitiesTablePtr
    876 xmlCreateEntitiesTable(void) {
    877     return((xmlEntitiesTablePtr) xmlHashCreate(0));
    878 }
    879 
    880 /**
    881  * xmlFreeEntityWrapper:
    882  * @entity:  An entity
    883  * @name:  its name
    884  *
    885  * Deallocate the memory used by an entities in the hash table.
    886  */
    887 static void
    888 xmlFreeEntityWrapper(void *entity, const xmlChar *name ATTRIBUTE_UNUSED) {
    889     if (entity != NULL)
    890 	xmlFreeEntity((xmlEntityPtr) entity);
    891 }
    892 
    893 /**
    894  * xmlFreeEntitiesTable:
    895  * @table:  An entity table
    896  *
    897  * Deallocate the memory used by an entities hash table.
    898  */
    899 void
    900 xmlFreeEntitiesTable(xmlEntitiesTablePtr table) {
    901     xmlHashFree(table, xmlFreeEntityWrapper);
    902 }
    903 
    904 #ifdef LIBXML_TREE_ENABLED
    905 /**
    906  * xmlCopyEntity:
    907  * @ent:  An entity
    908  *
    909  * Build a copy of an entity
    910  *
    911  * Returns the new xmlEntitiesPtr or NULL in case of error.
    912  */
    913 static void *
    914 xmlCopyEntity(void *payload, const xmlChar *name ATTRIBUTE_UNUSED) {
    915     xmlEntityPtr ent = (xmlEntityPtr) payload;
    916     xmlEntityPtr cur;
    917 
    918     cur = (xmlEntityPtr) xmlMalloc(sizeof(xmlEntity));
    919     if (cur == NULL) {
    920         xmlEntitiesErrMemory("xmlCopyEntity:: malloc failed");
    921 	return(NULL);
    922     }
    923     memset(cur, 0, sizeof(xmlEntity));
    924     cur->type = XML_ENTITY_DECL;
    925 
    926     cur->etype = ent->etype;
    927     if (ent->name != NULL)
    928 	cur->name = xmlStrdup(ent->name);
    929     if (ent->ExternalID != NULL)
    930 	cur->ExternalID = xmlStrdup(ent->ExternalID);
    931     if (ent->SystemID != NULL)
    932 	cur->SystemID = xmlStrdup(ent->SystemID);
    933     if (ent->content != NULL)
    934 	cur->content = xmlStrdup(ent->content);
    935     if (ent->orig != NULL)
    936 	cur->orig = xmlStrdup(ent->orig);
    937     if (ent->URI != NULL)
    938 	cur->URI = xmlStrdup(ent->URI);
    939     return(cur);
    940 }
    941 
    942 /**
    943  * xmlCopyEntitiesTable:
    944  * @table:  An entity table
    945  *
    946  * Build a copy of an entity table.
    947  *
    948  * Returns the new xmlEntitiesTablePtr or NULL in case of error.
    949  */
    950 xmlEntitiesTablePtr
    951 xmlCopyEntitiesTable(xmlEntitiesTablePtr table) {
    952     return(xmlHashCopy(table, xmlCopyEntity));
    953 }
    954 #endif /* LIBXML_TREE_ENABLED */
    955 
    956 #ifdef LIBXML_OUTPUT_ENABLED
    957 
    958 /**
    959  * xmlDumpEntityContent:
    960  * @buf:  An XML buffer.
    961  * @content:  The entity content.
    962  *
    963  * This will dump the quoted string value, taking care of the special
    964  * treatment required by %
    965  */
    966 static void
    967 xmlDumpEntityContent(xmlBufferPtr buf, const xmlChar *content) {
    968     if (buf->alloc == XML_BUFFER_ALLOC_IMMUTABLE) return;
    969     if (xmlStrchr(content, '%')) {
    970         const xmlChar * base, *cur;
    971 
    972 	xmlBufferCCat(buf, "\"");
    973 	base = cur = content;
    974 	while (*cur != 0) {
    975 	    if (*cur == '"') {
    976 		if (base != cur)
    977 		    xmlBufferAdd(buf, base, cur - base);
    978 		xmlBufferAdd(buf, BAD_CAST "&quot;", 6);
    979 		cur++;
    980 		base = cur;
    981 	    } else if (*cur == '%') {
    982 		if (base != cur)
    983 		    xmlBufferAdd(buf, base, cur - base);
    984 		xmlBufferAdd(buf, BAD_CAST "&#x25;", 6);
    985 		cur++;
    986 		base = cur;
    987 	    } else {
    988 		cur++;
    989 	    }
    990 	}
    991 	if (base != cur)
    992 	    xmlBufferAdd(buf, base, cur - base);
    993 	xmlBufferCCat(buf, "\"");
    994     } else {
    995         xmlBufferWriteQuotedString(buf, content);
    996     }
    997 }
    998 
    999 /**
   1000  * xmlDumpEntityDecl:
   1001  * @buf:  An XML buffer.
   1002  * @ent:  An entity table
   1003  *
   1004  * This will dump the content of the entity table as an XML DTD definition
   1005  */
   1006 void
   1007 xmlDumpEntityDecl(xmlBufferPtr buf, xmlEntityPtr ent) {
   1008     if ((buf == NULL) || (ent == NULL)) return;
   1009     switch (ent->etype) {
   1010 	case XML_INTERNAL_GENERAL_ENTITY:
   1011 	    xmlBufferWriteChar(buf, "<!ENTITY ");
   1012 	    xmlBufferWriteCHAR(buf, ent->name);
   1013 	    xmlBufferWriteChar(buf, " ");
   1014 	    if (ent->orig != NULL)
   1015 		xmlBufferWriteQuotedString(buf, ent->orig);
   1016 	    else
   1017 		xmlDumpEntityContent(buf, ent->content);
   1018 	    xmlBufferWriteChar(buf, ">\n");
   1019 	    break;
   1020 	case XML_EXTERNAL_GENERAL_PARSED_ENTITY:
   1021 	    xmlBufferWriteChar(buf, "<!ENTITY ");
   1022 	    xmlBufferWriteCHAR(buf, ent->name);
   1023 	    if (ent->ExternalID != NULL) {
   1024 		 xmlBufferWriteChar(buf, " PUBLIC ");
   1025 		 xmlBufferWriteQuotedString(buf, ent->ExternalID);
   1026 		 xmlBufferWriteChar(buf, " ");
   1027 		 xmlBufferWriteQuotedString(buf, ent->SystemID);
   1028 	    } else {
   1029 		 xmlBufferWriteChar(buf, " SYSTEM ");
   1030 		 xmlBufferWriteQuotedString(buf, ent->SystemID);
   1031 	    }
   1032 	    xmlBufferWriteChar(buf, ">\n");
   1033 	    break;
   1034 	case XML_EXTERNAL_GENERAL_UNPARSED_ENTITY:
   1035 	    xmlBufferWriteChar(buf, "<!ENTITY ");
   1036 	    xmlBufferWriteCHAR(buf, ent->name);
   1037 	    if (ent->ExternalID != NULL) {
   1038 		 xmlBufferWriteChar(buf, " PUBLIC ");
   1039 		 xmlBufferWriteQuotedString(buf, ent->ExternalID);
   1040 		 xmlBufferWriteChar(buf, " ");
   1041 		 xmlBufferWriteQuotedString(buf, ent->SystemID);
   1042 	    } else {
   1043 		 xmlBufferWriteChar(buf, " SYSTEM ");
   1044 		 xmlBufferWriteQuotedString(buf, ent->SystemID);
   1045 	    }
   1046 	    if (ent->content != NULL) { /* Should be true ! */
   1047 		xmlBufferWriteChar(buf, " NDATA ");
   1048 		if (ent->orig != NULL)
   1049 		    xmlBufferWriteCHAR(buf, ent->orig);
   1050 		else
   1051 		    xmlBufferWriteCHAR(buf, ent->content);
   1052 	    }
   1053 	    xmlBufferWriteChar(buf, ">\n");
   1054 	    break;
   1055 	case XML_INTERNAL_PARAMETER_ENTITY:
   1056 	    xmlBufferWriteChar(buf, "<!ENTITY % ");
   1057 	    xmlBufferWriteCHAR(buf, ent->name);
   1058 	    xmlBufferWriteChar(buf, " ");
   1059 	    if (ent->orig == NULL)
   1060 		xmlDumpEntityContent(buf, ent->content);
   1061 	    else
   1062 		xmlBufferWriteQuotedString(buf, ent->orig);
   1063 	    xmlBufferWriteChar(buf, ">\n");
   1064 	    break;
   1065 	case XML_EXTERNAL_PARAMETER_ENTITY:
   1066 	    xmlBufferWriteChar(buf, "<!ENTITY % ");
   1067 	    xmlBufferWriteCHAR(buf, ent->name);
   1068 	    if (ent->ExternalID != NULL) {
   1069 		 xmlBufferWriteChar(buf, " PUBLIC ");
   1070 		 xmlBufferWriteQuotedString(buf, ent->ExternalID);
   1071 		 xmlBufferWriteChar(buf, " ");
   1072 		 xmlBufferWriteQuotedString(buf, ent->SystemID);
   1073 	    } else {
   1074 		 xmlBufferWriteChar(buf, " SYSTEM ");
   1075 		 xmlBufferWriteQuotedString(buf, ent->SystemID);
   1076 	    }
   1077 	    xmlBufferWriteChar(buf, ">\n");
   1078 	    break;
   1079 	default:
   1080 	    xmlEntitiesErr(XML_DTD_UNKNOWN_ENTITY,
   1081 		"xmlDumpEntitiesDecl: internal: unknown type entity type");
   1082     }
   1083 }
   1084 
   1085 /**
   1086  * xmlDumpEntityDeclScan:
   1087  * @ent:  An entity table
   1088  * @buf:  An XML buffer.
   1089  *
   1090  * When using the hash table scan function, arguments need to be reversed
   1091  */
   1092 static void
   1093 xmlDumpEntityDeclScan(void *ent, void *buf,
   1094                       const xmlChar *name ATTRIBUTE_UNUSED) {
   1095     xmlDumpEntityDecl((xmlBufferPtr) buf, (xmlEntityPtr) ent);
   1096 }
   1097 
   1098 /**
   1099  * xmlDumpEntitiesTable:
   1100  * @buf:  An XML buffer.
   1101  * @table:  An entity table
   1102  *
   1103  * This will dump the content of the entity table as an XML DTD definition
   1104  */
   1105 void
   1106 xmlDumpEntitiesTable(xmlBufferPtr buf, xmlEntitiesTablePtr table) {
   1107     xmlHashScan(table, xmlDumpEntityDeclScan, buf);
   1108 }
   1109 #endif /* LIBXML_OUTPUT_ENABLED */
   1110 #define bottom_entities
   1111 #include "elfgcchack.h"
   1112