1 /* 2 * SAX2.c : Default SAX2 handler to build a tree. 3 * 4 * See Copyright for the status of this software. 5 * 6 * Daniel Veillard <daniel (at) veillard.com> 7 */ 8 9 10 #define IN_LIBXML 11 #include "libxml.h" 12 #include <stdlib.h> 13 #include <string.h> 14 #include <limits.h> 15 #include <libxml/xmlmemory.h> 16 #include <libxml/tree.h> 17 #include <libxml/parser.h> 18 #include <libxml/parserInternals.h> 19 #include <libxml/valid.h> 20 #include <libxml/entities.h> 21 #include <libxml/xmlerror.h> 22 #include <libxml/debugXML.h> 23 #include <libxml/xmlIO.h> 24 #include <libxml/SAX.h> 25 #include <libxml/uri.h> 26 #include <libxml/valid.h> 27 #include <libxml/HTMLtree.h> 28 #include <libxml/globals.h> 29 30 /* Define SIZE_T_MAX unless defined through <limits.h>. */ 31 #ifndef SIZE_T_MAX 32 # define SIZE_T_MAX ((size_t)-1) 33 #endif /* !SIZE_T_MAX */ 34 35 /* #define DEBUG_SAX2 */ 36 /* #define DEBUG_SAX2_TREE */ 37 38 /** 39 * TODO: 40 * 41 * macro to flag unimplemented blocks 42 * XML_CATALOG_PREFER user env to select between system/public prefered 43 * option. C.f. Richard Tobin <richard (at) cogsci.ed.ac.uk> 44 *> Just FYI, I am using an environment variable XML_CATALOG_PREFER with 45 *> values "system" and "public". I have made the default be "system" to 46 *> match yours. 47 */ 48 #define TODO \ 49 xmlGenericError(xmlGenericErrorContext, \ 50 "Unimplemented block at %s:%d\n", \ 51 __FILE__, __LINE__); 52 53 /* 54 * xmlSAX2ErrMemory: 55 * @ctxt: an XML validation parser context 56 * @msg: a string to accompany the error message 57 */ 58 static void 59 xmlSAX2ErrMemory(xmlParserCtxtPtr ctxt, const char *msg) { 60 xmlStructuredErrorFunc schannel = NULL; 61 const char *str1 = "out of memory\n"; 62 63 if (ctxt != NULL) { 64 ctxt->errNo = XML_ERR_NO_MEMORY; 65 if ((ctxt->sax != NULL) && (ctxt->sax->initialized == XML_SAX2_MAGIC)) 66 schannel = ctxt->sax->serror; 67 __xmlRaiseError(schannel, 68 ctxt->vctxt.error, ctxt->vctxt.userData, 69 ctxt, NULL, XML_FROM_PARSER, XML_ERR_NO_MEMORY, 70 XML_ERR_ERROR, NULL, 0, (const char *) str1, 71 NULL, NULL, 0, 0, 72 msg, (const char *) str1, NULL); 73 ctxt->errNo = XML_ERR_NO_MEMORY; 74 ctxt->instate = XML_PARSER_EOF; 75 ctxt->disableSAX = 1; 76 } else { 77 __xmlRaiseError(schannel, 78 NULL, NULL, 79 ctxt, NULL, XML_FROM_PARSER, XML_ERR_NO_MEMORY, 80 XML_ERR_ERROR, NULL, 0, (const char *) str1, 81 NULL, NULL, 0, 0, 82 msg, (const char *) str1, NULL); 83 } 84 } 85 86 /** 87 * xmlValidError: 88 * @ctxt: an XML validation parser context 89 * @error: the error number 90 * @msg: the error message 91 * @str1: extra data 92 * @str2: extra data 93 * 94 * Handle a validation error 95 */ 96 static void 97 xmlErrValid(xmlParserCtxtPtr ctxt, xmlParserErrors error, 98 const char *msg, const char *str1, const char *str2) 99 { 100 xmlStructuredErrorFunc schannel = NULL; 101 102 if ((ctxt != NULL) && (ctxt->disableSAX != 0) && 103 (ctxt->instate == XML_PARSER_EOF)) 104 return; 105 if (ctxt != NULL) { 106 ctxt->errNo = error; 107 if ((ctxt->sax != NULL) && (ctxt->sax->initialized == XML_SAX2_MAGIC)) 108 schannel = ctxt->sax->serror; 109 __xmlRaiseError(schannel, 110 ctxt->vctxt.error, ctxt->vctxt.userData, 111 ctxt, NULL, XML_FROM_DTD, error, 112 XML_ERR_ERROR, NULL, 0, (const char *) str1, 113 (const char *) str2, NULL, 0, 0, 114 msg, (const char *) str1, (const char *) str2); 115 ctxt->valid = 0; 116 } else { 117 __xmlRaiseError(schannel, 118 NULL, NULL, 119 ctxt, NULL, XML_FROM_DTD, error, 120 XML_ERR_ERROR, NULL, 0, (const char *) str1, 121 (const char *) str2, NULL, 0, 0, 122 msg, (const char *) str1, (const char *) str2); 123 } 124 } 125 126 /** 127 * xmlFatalErrMsg: 128 * @ctxt: an XML parser context 129 * @error: the error number 130 * @msg: the error message 131 * @str1: an error string 132 * @str2: an error string 133 * 134 * Handle a fatal parser error, i.e. violating Well-Formedness constraints 135 */ 136 static void 137 xmlFatalErrMsg(xmlParserCtxtPtr ctxt, xmlParserErrors error, 138 const char *msg, const xmlChar *str1, const xmlChar *str2) 139 { 140 if ((ctxt != NULL) && (ctxt->disableSAX != 0) && 141 (ctxt->instate == XML_PARSER_EOF)) 142 return; 143 if (ctxt != NULL) 144 ctxt->errNo = error; 145 __xmlRaiseError(NULL, NULL, NULL, ctxt, NULL, XML_FROM_PARSER, error, 146 XML_ERR_FATAL, NULL, 0, 147 (const char *) str1, (const char *) str2, 148 NULL, 0, 0, msg, str1, str2); 149 if (ctxt != NULL) { 150 ctxt->wellFormed = 0; 151 ctxt->valid = 0; 152 if (ctxt->recovery == 0) 153 ctxt->disableSAX = 1; 154 } 155 } 156 157 /** 158 * xmlWarnMsg: 159 * @ctxt: an XML parser context 160 * @error: the error number 161 * @msg: the error message 162 * @str1: an error string 163 * @str2: an error string 164 * 165 * Handle a parser warning 166 */ 167 static void 168 xmlWarnMsg(xmlParserCtxtPtr ctxt, xmlParserErrors error, 169 const char *msg, const xmlChar *str1) 170 { 171 if ((ctxt != NULL) && (ctxt->disableSAX != 0) && 172 (ctxt->instate == XML_PARSER_EOF)) 173 return; 174 if (ctxt != NULL) 175 ctxt->errNo = error; 176 __xmlRaiseError(NULL, NULL, NULL, ctxt, NULL, XML_FROM_PARSER, error, 177 XML_ERR_WARNING, NULL, 0, 178 (const char *) str1, NULL, 179 NULL, 0, 0, msg, str1); 180 } 181 182 /** 183 * xmlNsErrMsg: 184 * @ctxt: an XML parser context 185 * @error: the error number 186 * @msg: the error message 187 * @str1: an error string 188 * @str2: an error string 189 * 190 * Handle a namespace error 191 */ 192 static void 193 xmlNsErrMsg(xmlParserCtxtPtr ctxt, xmlParserErrors error, 194 const char *msg, const xmlChar *str1, const xmlChar *str2) 195 { 196 if ((ctxt != NULL) && (ctxt->disableSAX != 0) && 197 (ctxt->instate == XML_PARSER_EOF)) 198 return; 199 if (ctxt != NULL) 200 ctxt->errNo = error; 201 __xmlRaiseError(NULL, NULL, NULL, ctxt, NULL, XML_FROM_NAMESPACE, error, 202 XML_ERR_ERROR, NULL, 0, 203 (const char *) str1, (const char *) str2, 204 NULL, 0, 0, msg, str1, str2); 205 } 206 207 /** 208 * xmlNsWarnMsg: 209 * @ctxt: an XML parser context 210 * @error: the error number 211 * @msg: the error message 212 * @str1: an error string 213 * 214 * Handle a namespace warning 215 */ 216 static void 217 xmlNsWarnMsg(xmlParserCtxtPtr ctxt, xmlParserErrors error, 218 const char *msg, const xmlChar *str1, const xmlChar *str2) 219 { 220 if ((ctxt != NULL) && (ctxt->disableSAX != 0) && 221 (ctxt->instate == XML_PARSER_EOF)) 222 return; 223 if (ctxt != NULL) 224 ctxt->errNo = error; 225 __xmlRaiseError(NULL, NULL, NULL, ctxt, NULL, XML_FROM_NAMESPACE, error, 226 XML_ERR_WARNING, NULL, 0, 227 (const char *) str1, (const char *) str2, 228 NULL, 0, 0, msg, str1, str2); 229 } 230 231 /** 232 * xmlSAX2GetPublicId: 233 * @ctx: the user data (XML parser context) 234 * 235 * Provides the public ID e.g. "-//SGMLSOURCE//DTD DEMO//EN" 236 * 237 * Returns a xmlChar * 238 */ 239 const xmlChar * 240 xmlSAX2GetPublicId(void *ctx ATTRIBUTE_UNUSED) 241 { 242 /* xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; */ 243 return(NULL); 244 } 245 246 /** 247 * xmlSAX2GetSystemId: 248 * @ctx: the user data (XML parser context) 249 * 250 * Provides the system ID, basically URL or filename e.g. 251 * http://www.sgmlsource.com/dtds/memo.dtd 252 * 253 * Returns a xmlChar * 254 */ 255 const xmlChar * 256 xmlSAX2GetSystemId(void *ctx) 257 { 258 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; 259 if ((ctx == NULL) || (ctxt->input == NULL)) return(NULL); 260 return((const xmlChar *) ctxt->input->filename); 261 } 262 263 /** 264 * xmlSAX2GetLineNumber: 265 * @ctx: the user data (XML parser context) 266 * 267 * Provide the line number of the current parsing point. 268 * 269 * Returns an int 270 */ 271 int 272 xmlSAX2GetLineNumber(void *ctx) 273 { 274 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; 275 if ((ctx == NULL) || (ctxt->input == NULL)) return(0); 276 return(ctxt->input->line); 277 } 278 279 /** 280 * xmlSAX2GetColumnNumber: 281 * @ctx: the user data (XML parser context) 282 * 283 * Provide the column number of the current parsing point. 284 * 285 * Returns an int 286 */ 287 int 288 xmlSAX2GetColumnNumber(void *ctx) 289 { 290 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; 291 if ((ctx == NULL) || (ctxt->input == NULL)) return(0); 292 return(ctxt->input->col); 293 } 294 295 /** 296 * xmlSAX2IsStandalone: 297 * @ctx: the user data (XML parser context) 298 * 299 * Is this document tagged standalone ? 300 * 301 * Returns 1 if true 302 */ 303 int 304 xmlSAX2IsStandalone(void *ctx) 305 { 306 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; 307 if ((ctx == NULL) || (ctxt->myDoc == NULL)) return(0); 308 return(ctxt->myDoc->standalone == 1); 309 } 310 311 /** 312 * xmlSAX2HasInternalSubset: 313 * @ctx: the user data (XML parser context) 314 * 315 * Does this document has an internal subset 316 * 317 * Returns 1 if true 318 */ 319 int 320 xmlSAX2HasInternalSubset(void *ctx) 321 { 322 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; 323 if ((ctxt == NULL) || (ctxt->myDoc == NULL)) return(0); 324 return(ctxt->myDoc->intSubset != NULL); 325 } 326 327 /** 328 * xmlSAX2HasExternalSubset: 329 * @ctx: the user data (XML parser context) 330 * 331 * Does this document has an external subset 332 * 333 * Returns 1 if true 334 */ 335 int 336 xmlSAX2HasExternalSubset(void *ctx) 337 { 338 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; 339 if ((ctxt == NULL) || (ctxt->myDoc == NULL)) return(0); 340 return(ctxt->myDoc->extSubset != NULL); 341 } 342 343 /** 344 * xmlSAX2InternalSubset: 345 * @ctx: the user data (XML parser context) 346 * @name: the root element name 347 * @ExternalID: the external ID 348 * @SystemID: the SYSTEM ID (e.g. filename or URL) 349 * 350 * Callback on internal subset declaration. 351 */ 352 void 353 xmlSAX2InternalSubset(void *ctx, const xmlChar *name, 354 const xmlChar *ExternalID, const xmlChar *SystemID) 355 { 356 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; 357 xmlDtdPtr dtd; 358 if (ctx == NULL) return; 359 #ifdef DEBUG_SAX 360 xmlGenericError(xmlGenericErrorContext, 361 "SAX.xmlSAX2InternalSubset(%s, %s, %s)\n", 362 name, ExternalID, SystemID); 363 #endif 364 365 if (ctxt->myDoc == NULL) 366 return; 367 dtd = xmlGetIntSubset(ctxt->myDoc); 368 if (dtd != NULL) { 369 if (ctxt->html) 370 return; 371 xmlUnlinkNode((xmlNodePtr) dtd); 372 xmlFreeDtd(dtd); 373 ctxt->myDoc->intSubset = NULL; 374 } 375 ctxt->myDoc->intSubset = 376 xmlCreateIntSubset(ctxt->myDoc, name, ExternalID, SystemID); 377 if (ctxt->myDoc->intSubset == NULL) 378 xmlSAX2ErrMemory(ctxt, "xmlSAX2InternalSubset"); 379 } 380 381 /** 382 * xmlSAX2ExternalSubset: 383 * @ctx: the user data (XML parser context) 384 * @name: the root element name 385 * @ExternalID: the external ID 386 * @SystemID: the SYSTEM ID (e.g. filename or URL) 387 * 388 * Callback on external subset declaration. 389 */ 390 void 391 xmlSAX2ExternalSubset(void *ctx, const xmlChar *name, 392 const xmlChar *ExternalID, const xmlChar *SystemID) 393 { 394 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; 395 if (ctx == NULL) return; 396 #ifdef DEBUG_SAX 397 xmlGenericError(xmlGenericErrorContext, 398 "SAX.xmlSAX2ExternalSubset(%s, %s, %s)\n", 399 name, ExternalID, SystemID); 400 #endif 401 if (((ExternalID != NULL) || (SystemID != NULL)) && 402 (((ctxt->validate) || (ctxt->loadsubset != 0)) && 403 (ctxt->wellFormed && ctxt->myDoc))) { 404 /* 405 * Try to fetch and parse the external subset. 406 */ 407 xmlParserInputPtr oldinput; 408 int oldinputNr; 409 int oldinputMax; 410 xmlParserInputPtr *oldinputTab; 411 xmlParserInputPtr input = NULL; 412 xmlCharEncoding enc; 413 int oldcharset; 414 const xmlChar *oldencoding; 415 416 /* 417 * Ask the Entity resolver to load the damn thing 418 */ 419 if ((ctxt->sax != NULL) && (ctxt->sax->resolveEntity != NULL)) 420 input = ctxt->sax->resolveEntity(ctxt->userData, ExternalID, 421 SystemID); 422 if (input == NULL) { 423 return; 424 } 425 426 xmlNewDtd(ctxt->myDoc, name, ExternalID, SystemID); 427 428 /* 429 * make sure we won't destroy the main document context 430 */ 431 oldinput = ctxt->input; 432 oldinputNr = ctxt->inputNr; 433 oldinputMax = ctxt->inputMax; 434 oldinputTab = ctxt->inputTab; 435 oldcharset = ctxt->charset; 436 oldencoding = ctxt->encoding; 437 ctxt->encoding = NULL; 438 439 ctxt->inputTab = (xmlParserInputPtr *) 440 xmlMalloc(5 * sizeof(xmlParserInputPtr)); 441 if (ctxt->inputTab == NULL) { 442 xmlSAX2ErrMemory(ctxt, "xmlSAX2ExternalSubset"); 443 ctxt->input = oldinput; 444 ctxt->inputNr = oldinputNr; 445 ctxt->inputMax = oldinputMax; 446 ctxt->inputTab = oldinputTab; 447 ctxt->charset = oldcharset; 448 ctxt->encoding = oldencoding; 449 return; 450 } 451 ctxt->inputNr = 0; 452 ctxt->inputMax = 5; 453 ctxt->input = NULL; 454 xmlPushInput(ctxt, input); 455 456 /* 457 * On the fly encoding conversion if needed 458 */ 459 if (ctxt->input->length >= 4) { 460 enc = xmlDetectCharEncoding(ctxt->input->cur, 4); 461 xmlSwitchEncoding(ctxt, enc); 462 } 463 464 if (input->filename == NULL) 465 input->filename = (char *) xmlCanonicPath(SystemID); 466 input->line = 1; 467 input->col = 1; 468 input->base = ctxt->input->cur; 469 input->cur = ctxt->input->cur; 470 input->free = NULL; 471 472 /* 473 * let's parse that entity knowing it's an external subset. 474 */ 475 xmlParseExternalSubset(ctxt, ExternalID, SystemID); 476 477 /* 478 * Free up the external entities 479 */ 480 481 while (ctxt->inputNr > 1) 482 xmlPopInput(ctxt); 483 xmlFreeInputStream(ctxt->input); 484 xmlFree(ctxt->inputTab); 485 486 /* 487 * Restore the parsing context of the main entity 488 */ 489 ctxt->input = oldinput; 490 ctxt->inputNr = oldinputNr; 491 ctxt->inputMax = oldinputMax; 492 ctxt->inputTab = oldinputTab; 493 ctxt->charset = oldcharset; 494 if ((ctxt->encoding != NULL) && 495 ((ctxt->dict == NULL) || 496 (!xmlDictOwns(ctxt->dict, ctxt->encoding)))) 497 xmlFree((xmlChar *) ctxt->encoding); 498 ctxt->encoding = oldencoding; 499 /* ctxt->wellFormed = oldwellFormed; */ 500 } 501 } 502 503 /** 504 * xmlSAX2ResolveEntity: 505 * @ctx: the user data (XML parser context) 506 * @publicId: The public ID of the entity 507 * @systemId: The system ID of the entity 508 * 509 * The entity loader, to control the loading of external entities, 510 * the application can either: 511 * - override this xmlSAX2ResolveEntity() callback in the SAX block 512 * - or better use the xmlSetExternalEntityLoader() function to 513 * set up it's own entity resolution routine 514 * 515 * Returns the xmlParserInputPtr if inlined or NULL for DOM behaviour. 516 */ 517 xmlParserInputPtr 518 xmlSAX2ResolveEntity(void *ctx, const xmlChar *publicId, const xmlChar *systemId) 519 { 520 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; 521 xmlParserInputPtr ret; 522 xmlChar *URI; 523 const char *base = NULL; 524 525 if (ctx == NULL) return(NULL); 526 if (ctxt->input != NULL) 527 base = ctxt->input->filename; 528 if (base == NULL) 529 base = ctxt->directory; 530 531 URI = xmlBuildURI(systemId, (const xmlChar *) base); 532 533 #ifdef DEBUG_SAX 534 xmlGenericError(xmlGenericErrorContext, 535 "SAX.xmlSAX2ResolveEntity(%s, %s)\n", publicId, systemId); 536 #endif 537 538 ret = xmlLoadExternalEntity((const char *) URI, 539 (const char *) publicId, ctxt); 540 if (URI != NULL) 541 xmlFree(URI); 542 return(ret); 543 } 544 545 /** 546 * xmlSAX2GetEntity: 547 * @ctx: the user data (XML parser context) 548 * @name: The entity name 549 * 550 * Get an entity by name 551 * 552 * Returns the xmlEntityPtr if found. 553 */ 554 xmlEntityPtr 555 xmlSAX2GetEntity(void *ctx, const xmlChar *name) 556 { 557 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; 558 xmlEntityPtr ret = NULL; 559 560 if (ctx == NULL) return(NULL); 561 #ifdef DEBUG_SAX 562 xmlGenericError(xmlGenericErrorContext, 563 "SAX.xmlSAX2GetEntity(%s)\n", name); 564 #endif 565 566 if (ctxt->inSubset == 0) { 567 ret = xmlGetPredefinedEntity(name); 568 if (ret != NULL) 569 return(ret); 570 } 571 if ((ctxt->myDoc != NULL) && (ctxt->myDoc->standalone == 1)) { 572 if (ctxt->inSubset == 2) { 573 ctxt->myDoc->standalone = 0; 574 ret = xmlGetDocEntity(ctxt->myDoc, name); 575 ctxt->myDoc->standalone = 1; 576 } else { 577 ret = xmlGetDocEntity(ctxt->myDoc, name); 578 if (ret == NULL) { 579 ctxt->myDoc->standalone = 0; 580 ret = xmlGetDocEntity(ctxt->myDoc, name); 581 if (ret != NULL) { 582 xmlFatalErrMsg(ctxt, XML_ERR_NOT_STANDALONE, 583 "Entity(%s) document marked standalone but requires external subset\n", 584 name, NULL); 585 } 586 ctxt->myDoc->standalone = 1; 587 } 588 } 589 } else { 590 ret = xmlGetDocEntity(ctxt->myDoc, name); 591 } 592 if ((ret != NULL) && 593 ((ctxt->validate) || (ctxt->replaceEntities)) && 594 (ret->children == NULL) && 595 (ret->etype == XML_EXTERNAL_GENERAL_PARSED_ENTITY)) { 596 int val; 597 598 /* 599 * for validation purposes we really need to fetch and 600 * parse the external entity 601 */ 602 xmlNodePtr children; 603 unsigned long oldnbent = ctxt->nbentities; 604 605 val = xmlParseCtxtExternalEntity(ctxt, ret->URI, 606 ret->ExternalID, &children); 607 if (val == 0) { 608 xmlAddChildList((xmlNodePtr) ret, children); 609 } else { 610 xmlFatalErrMsg(ctxt, XML_ERR_ENTITY_PROCESSING, 611 "Failure to process entity %s\n", name, NULL); 612 ctxt->validate = 0; 613 return(NULL); 614 } 615 ret->owner = 1; 616 if (ret->checked == 0) { 617 ret->checked = (ctxt->nbentities - oldnbent + 1) * 2; 618 if ((ret->content != NULL) && (xmlStrchr(ret->content, '<'))) 619 ret->checked |= 1; 620 } 621 } 622 return(ret); 623 } 624 625 /** 626 * xmlSAX2GetParameterEntity: 627 * @ctx: the user data (XML parser context) 628 * @name: The entity name 629 * 630 * Get a parameter entity by name 631 * 632 * Returns the xmlEntityPtr if found. 633 */ 634 xmlEntityPtr 635 xmlSAX2GetParameterEntity(void *ctx, const xmlChar *name) 636 { 637 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; 638 xmlEntityPtr ret; 639 640 if (ctx == NULL) return(NULL); 641 #ifdef DEBUG_SAX 642 xmlGenericError(xmlGenericErrorContext, 643 "SAX.xmlSAX2GetParameterEntity(%s)\n", name); 644 #endif 645 646 ret = xmlGetParameterEntity(ctxt->myDoc, name); 647 return(ret); 648 } 649 650 651 /** 652 * xmlSAX2EntityDecl: 653 * @ctx: the user data (XML parser context) 654 * @name: the entity name 655 * @type: the entity type 656 * @publicId: The public ID of the entity 657 * @systemId: The system ID of the entity 658 * @content: the entity value (without processing). 659 * 660 * An entity definition has been parsed 661 */ 662 void 663 xmlSAX2EntityDecl(void *ctx, const xmlChar *name, int type, 664 const xmlChar *publicId, const xmlChar *systemId, xmlChar *content) 665 { 666 xmlEntityPtr ent; 667 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; 668 669 if (ctx == NULL) return; 670 #ifdef DEBUG_SAX 671 xmlGenericError(xmlGenericErrorContext, 672 "SAX.xmlSAX2EntityDecl(%s, %d, %s, %s, %s)\n", 673 name, type, publicId, systemId, content); 674 #endif 675 if (ctxt->inSubset == 1) { 676 ent = xmlAddDocEntity(ctxt->myDoc, name, type, publicId, 677 systemId, content); 678 if ((ent == NULL) && (ctxt->pedantic)) 679 xmlWarnMsg(ctxt, XML_WAR_ENTITY_REDEFINED, 680 "Entity(%s) already defined in the internal subset\n", 681 name); 682 if ((ent != NULL) && (ent->URI == NULL) && (systemId != NULL)) { 683 xmlChar *URI; 684 const char *base = NULL; 685 686 if (ctxt->input != NULL) 687 base = ctxt->input->filename; 688 if (base == NULL) 689 base = ctxt->directory; 690 691 URI = xmlBuildURI(systemId, (const xmlChar *) base); 692 ent->URI = URI; 693 } 694 } else if (ctxt->inSubset == 2) { 695 ent = xmlAddDtdEntity(ctxt->myDoc, name, type, publicId, 696 systemId, content); 697 if ((ent == NULL) && (ctxt->pedantic) && 698 (ctxt->sax != NULL) && (ctxt->sax->warning != NULL)) 699 ctxt->sax->warning(ctxt->userData, 700 "Entity(%s) already defined in the external subset\n", name); 701 if ((ent != NULL) && (ent->URI == NULL) && (systemId != NULL)) { 702 xmlChar *URI; 703 const char *base = NULL; 704 705 if (ctxt->input != NULL) 706 base = ctxt->input->filename; 707 if (base == NULL) 708 base = ctxt->directory; 709 710 URI = xmlBuildURI(systemId, (const xmlChar *) base); 711 ent->URI = URI; 712 } 713 } else { 714 xmlFatalErrMsg(ctxt, XML_ERR_ENTITY_PROCESSING, 715 "SAX.xmlSAX2EntityDecl(%s) called while not in subset\n", 716 name, NULL); 717 } 718 } 719 720 /** 721 * xmlSAX2AttributeDecl: 722 * @ctx: the user data (XML parser context) 723 * @elem: the name of the element 724 * @fullname: the attribute name 725 * @type: the attribute type 726 * @def: the type of default value 727 * @defaultValue: the attribute default value 728 * @tree: the tree of enumerated value set 729 * 730 * An attribute definition has been parsed 731 */ 732 void 733 xmlSAX2AttributeDecl(void *ctx, const xmlChar *elem, const xmlChar *fullname, 734 int type, int def, const xmlChar *defaultValue, 735 xmlEnumerationPtr tree) 736 { 737 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; 738 xmlAttributePtr attr; 739 xmlChar *name = NULL, *prefix = NULL; 740 741 if ((ctxt == NULL) || (ctxt->myDoc == NULL)) 742 return; 743 744 #ifdef DEBUG_SAX 745 xmlGenericError(xmlGenericErrorContext, 746 "SAX.xmlSAX2AttributeDecl(%s, %s, %d, %d, %s, ...)\n", 747 elem, fullname, type, def, defaultValue); 748 #endif 749 if ((xmlStrEqual(fullname, BAD_CAST "xml:id")) && 750 (type != XML_ATTRIBUTE_ID)) { 751 /* 752 * Raise the error but keep the validity flag 753 */ 754 int tmp = ctxt->valid; 755 xmlErrValid(ctxt, XML_DTD_XMLID_TYPE, 756 "xml:id : attribute type should be ID\n", NULL, NULL); 757 ctxt->valid = tmp; 758 } 759 /* TODO: optimize name/prefix allocation */ 760 name = xmlSplitQName(ctxt, fullname, &prefix); 761 ctxt->vctxt.valid = 1; 762 if (ctxt->inSubset == 1) 763 attr = xmlAddAttributeDecl(&ctxt->vctxt, ctxt->myDoc->intSubset, elem, 764 name, prefix, (xmlAttributeType) type, 765 (xmlAttributeDefault) def, defaultValue, tree); 766 else if (ctxt->inSubset == 2) 767 attr = xmlAddAttributeDecl(&ctxt->vctxt, ctxt->myDoc->extSubset, elem, 768 name, prefix, (xmlAttributeType) type, 769 (xmlAttributeDefault) def, defaultValue, tree); 770 else { 771 xmlFatalErrMsg(ctxt, XML_ERR_INTERNAL_ERROR, 772 "SAX.xmlSAX2AttributeDecl(%s) called while not in subset\n", 773 name, NULL); 774 xmlFreeEnumeration(tree); 775 return; 776 } 777 #ifdef LIBXML_VALID_ENABLED 778 if (ctxt->vctxt.valid == 0) 779 ctxt->valid = 0; 780 if ((attr != NULL) && (ctxt->validate) && (ctxt->wellFormed) && 781 (ctxt->myDoc->intSubset != NULL)) 782 ctxt->valid &= xmlValidateAttributeDecl(&ctxt->vctxt, ctxt->myDoc, 783 attr); 784 #endif /* LIBXML_VALID_ENABLED */ 785 if (prefix != NULL) 786 xmlFree(prefix); 787 if (name != NULL) 788 xmlFree(name); 789 } 790 791 /** 792 * xmlSAX2ElementDecl: 793 * @ctx: the user data (XML parser context) 794 * @name: the element name 795 * @type: the element type 796 * @content: the element value tree 797 * 798 * An element definition has been parsed 799 */ 800 void 801 xmlSAX2ElementDecl(void *ctx, const xmlChar * name, int type, 802 xmlElementContentPtr content) 803 { 804 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; 805 xmlElementPtr elem = NULL; 806 807 if ((ctxt == NULL) || (ctxt->myDoc == NULL)) 808 return; 809 810 #ifdef DEBUG_SAX 811 xmlGenericError(xmlGenericErrorContext, 812 "SAX.xmlSAX2ElementDecl(%s, %d, ...)\n", name, type); 813 #endif 814 815 if (ctxt->inSubset == 1) 816 elem = xmlAddElementDecl(&ctxt->vctxt, ctxt->myDoc->intSubset, 817 name, (xmlElementTypeVal) type, content); 818 else if (ctxt->inSubset == 2) 819 elem = xmlAddElementDecl(&ctxt->vctxt, ctxt->myDoc->extSubset, 820 name, (xmlElementTypeVal) type, content); 821 else { 822 xmlFatalErrMsg(ctxt, XML_ERR_INTERNAL_ERROR, 823 "SAX.xmlSAX2ElementDecl(%s) called while not in subset\n", 824 name, NULL); 825 return; 826 } 827 #ifdef LIBXML_VALID_ENABLED 828 if (elem == NULL) 829 ctxt->valid = 0; 830 if (ctxt->validate && ctxt->wellFormed && 831 ctxt->myDoc && ctxt->myDoc->intSubset) 832 ctxt->valid &= 833 xmlValidateElementDecl(&ctxt->vctxt, ctxt->myDoc, elem); 834 #endif /* LIBXML_VALID_ENABLED */ 835 } 836 837 /** 838 * xmlSAX2NotationDecl: 839 * @ctx: the user data (XML parser context) 840 * @name: The name of the notation 841 * @publicId: The public ID of the entity 842 * @systemId: The system ID of the entity 843 * 844 * What to do when a notation declaration has been parsed. 845 */ 846 void 847 xmlSAX2NotationDecl(void *ctx, const xmlChar *name, 848 const xmlChar *publicId, const xmlChar *systemId) 849 { 850 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; 851 xmlNotationPtr nota = NULL; 852 853 if ((ctxt == NULL) || (ctxt->myDoc == NULL)) 854 return; 855 856 #ifdef DEBUG_SAX 857 xmlGenericError(xmlGenericErrorContext, 858 "SAX.xmlSAX2NotationDecl(%s, %s, %s)\n", name, publicId, systemId); 859 #endif 860 861 if ((publicId == NULL) && (systemId == NULL)) { 862 xmlFatalErrMsg(ctxt, XML_ERR_NOTATION_PROCESSING, 863 "SAX.xmlSAX2NotationDecl(%s) externalID or PublicID missing\n", 864 name, NULL); 865 return; 866 } else if (ctxt->inSubset == 1) 867 nota = xmlAddNotationDecl(&ctxt->vctxt, ctxt->myDoc->intSubset, name, 868 publicId, systemId); 869 else if (ctxt->inSubset == 2) 870 nota = xmlAddNotationDecl(&ctxt->vctxt, ctxt->myDoc->extSubset, name, 871 publicId, systemId); 872 else { 873 xmlFatalErrMsg(ctxt, XML_ERR_NOTATION_PROCESSING, 874 "SAX.xmlSAX2NotationDecl(%s) called while not in subset\n", 875 name, NULL); 876 return; 877 } 878 #ifdef LIBXML_VALID_ENABLED 879 if (nota == NULL) ctxt->valid = 0; 880 if ((ctxt->validate) && (ctxt->wellFormed) && 881 (ctxt->myDoc->intSubset != NULL)) 882 ctxt->valid &= xmlValidateNotationDecl(&ctxt->vctxt, ctxt->myDoc, 883 nota); 884 #endif /* LIBXML_VALID_ENABLED */ 885 } 886 887 /** 888 * xmlSAX2UnparsedEntityDecl: 889 * @ctx: the user data (XML parser context) 890 * @name: The name of the entity 891 * @publicId: The public ID of the entity 892 * @systemId: The system ID of the entity 893 * @notationName: the name of the notation 894 * 895 * What to do when an unparsed entity declaration is parsed 896 */ 897 void 898 xmlSAX2UnparsedEntityDecl(void *ctx, const xmlChar *name, 899 const xmlChar *publicId, const xmlChar *systemId, 900 const xmlChar *notationName) 901 { 902 xmlEntityPtr ent; 903 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; 904 if (ctx == NULL) return; 905 #ifdef DEBUG_SAX 906 xmlGenericError(xmlGenericErrorContext, 907 "SAX.xmlSAX2UnparsedEntityDecl(%s, %s, %s, %s)\n", 908 name, publicId, systemId, notationName); 909 #endif 910 if (ctxt->inSubset == 1) { 911 ent = xmlAddDocEntity(ctxt->myDoc, name, 912 XML_EXTERNAL_GENERAL_UNPARSED_ENTITY, 913 publicId, systemId, notationName); 914 if ((ent == NULL) && (ctxt->pedantic) && 915 (ctxt->sax != NULL) && (ctxt->sax->warning != NULL)) 916 ctxt->sax->warning(ctxt->userData, 917 "Entity(%s) already defined in the internal subset\n", name); 918 if ((ent != NULL) && (ent->URI == NULL) && (systemId != NULL)) { 919 xmlChar *URI; 920 const char *base = NULL; 921 922 if (ctxt->input != NULL) 923 base = ctxt->input->filename; 924 if (base == NULL) 925 base = ctxt->directory; 926 927 URI = xmlBuildURI(systemId, (const xmlChar *) base); 928 ent->URI = URI; 929 } 930 } else if (ctxt->inSubset == 2) { 931 ent = xmlAddDtdEntity(ctxt->myDoc, name, 932 XML_EXTERNAL_GENERAL_UNPARSED_ENTITY, 933 publicId, systemId, notationName); 934 if ((ent == NULL) && (ctxt->pedantic) && 935 (ctxt->sax != NULL) && (ctxt->sax->warning != NULL)) 936 ctxt->sax->warning(ctxt->userData, 937 "Entity(%s) already defined in the external subset\n", name); 938 if ((ent != NULL) && (ent->URI == NULL) && (systemId != NULL)) { 939 xmlChar *URI; 940 const char *base = NULL; 941 942 if (ctxt->input != NULL) 943 base = ctxt->input->filename; 944 if (base == NULL) 945 base = ctxt->directory; 946 947 URI = xmlBuildURI(systemId, (const xmlChar *) base); 948 ent->URI = URI; 949 } 950 } else { 951 xmlFatalErrMsg(ctxt, XML_ERR_INTERNAL_ERROR, 952 "SAX.xmlSAX2UnparsedEntityDecl(%s) called while not in subset\n", 953 name, NULL); 954 } 955 } 956 957 /** 958 * xmlSAX2SetDocumentLocator: 959 * @ctx: the user data (XML parser context) 960 * @loc: A SAX Locator 961 * 962 * Receive the document locator at startup, actually xmlDefaultSAXLocator 963 * Everything is available on the context, so this is useless in our case. 964 */ 965 void 966 xmlSAX2SetDocumentLocator(void *ctx ATTRIBUTE_UNUSED, xmlSAXLocatorPtr loc ATTRIBUTE_UNUSED) 967 { 968 /* xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; */ 969 #ifdef DEBUG_SAX 970 xmlGenericError(xmlGenericErrorContext, 971 "SAX.xmlSAX2SetDocumentLocator()\n"); 972 #endif 973 } 974 975 /** 976 * xmlSAX2StartDocument: 977 * @ctx: the user data (XML parser context) 978 * 979 * called when the document start being processed. 980 */ 981 void 982 xmlSAX2StartDocument(void *ctx) 983 { 984 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; 985 xmlDocPtr doc; 986 987 if (ctx == NULL) return; 988 989 #ifdef DEBUG_SAX 990 xmlGenericError(xmlGenericErrorContext, 991 "SAX.xmlSAX2StartDocument()\n"); 992 #endif 993 if (ctxt->html) { 994 #ifdef LIBXML_HTML_ENABLED 995 if (ctxt->myDoc == NULL) 996 ctxt->myDoc = htmlNewDocNoDtD(NULL, NULL); 997 ctxt->myDoc->properties = XML_DOC_HTML; 998 ctxt->myDoc->parseFlags = ctxt->options; 999 if (ctxt->myDoc == NULL) { 1000 xmlSAX2ErrMemory(ctxt, "xmlSAX2StartDocument"); 1001 return; 1002 } 1003 #else 1004 xmlGenericError(xmlGenericErrorContext, 1005 "libxml2 built without HTML support\n"); 1006 ctxt->errNo = XML_ERR_INTERNAL_ERROR; 1007 ctxt->instate = XML_PARSER_EOF; 1008 ctxt->disableSAX = 1; 1009 return; 1010 #endif 1011 } else { 1012 doc = ctxt->myDoc = xmlNewDoc(ctxt->version); 1013 if (doc != NULL) { 1014 doc->properties = 0; 1015 if (ctxt->options & XML_PARSE_OLD10) 1016 doc->properties |= XML_DOC_OLD10; 1017 doc->parseFlags = ctxt->options; 1018 if (ctxt->encoding != NULL) 1019 doc->encoding = xmlStrdup(ctxt->encoding); 1020 else 1021 doc->encoding = NULL; 1022 doc->standalone = ctxt->standalone; 1023 } else { 1024 xmlSAX2ErrMemory(ctxt, "xmlSAX2StartDocument"); 1025 return; 1026 } 1027 if ((ctxt->dictNames) && (doc != NULL)) { 1028 doc->dict = ctxt->dict; 1029 xmlDictReference(doc->dict); 1030 } 1031 } 1032 if ((ctxt->myDoc != NULL) && (ctxt->myDoc->URL == NULL) && 1033 (ctxt->input != NULL) && (ctxt->input->filename != NULL)) { 1034 ctxt->myDoc->URL = xmlPathToURI((const xmlChar *)ctxt->input->filename); 1035 if (ctxt->myDoc->URL == NULL) 1036 xmlSAX2ErrMemory(ctxt, "xmlSAX2StartDocument"); 1037 } 1038 } 1039 1040 /** 1041 * xmlSAX2EndDocument: 1042 * @ctx: the user data (XML parser context) 1043 * 1044 * called when the document end has been detected. 1045 */ 1046 void 1047 xmlSAX2EndDocument(void *ctx) 1048 { 1049 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; 1050 #ifdef DEBUG_SAX 1051 xmlGenericError(xmlGenericErrorContext, 1052 "SAX.xmlSAX2EndDocument()\n"); 1053 #endif 1054 if (ctx == NULL) return; 1055 #ifdef LIBXML_VALID_ENABLED 1056 if (ctxt->validate && ctxt->wellFormed && 1057 ctxt->myDoc && ctxt->myDoc->intSubset) 1058 ctxt->valid &= xmlValidateDocumentFinal(&ctxt->vctxt, ctxt->myDoc); 1059 #endif /* LIBXML_VALID_ENABLED */ 1060 1061 /* 1062 * Grab the encoding if it was added on-the-fly 1063 */ 1064 if ((ctxt->encoding != NULL) && (ctxt->myDoc != NULL) && 1065 (ctxt->myDoc->encoding == NULL)) { 1066 ctxt->myDoc->encoding = ctxt->encoding; 1067 ctxt->encoding = NULL; 1068 } 1069 if ((ctxt->inputTab != NULL) && 1070 (ctxt->inputNr > 0) && (ctxt->inputTab[0] != NULL) && 1071 (ctxt->inputTab[0]->encoding != NULL) && (ctxt->myDoc != NULL) && 1072 (ctxt->myDoc->encoding == NULL)) { 1073 ctxt->myDoc->encoding = xmlStrdup(ctxt->inputTab[0]->encoding); 1074 } 1075 if ((ctxt->charset != XML_CHAR_ENCODING_NONE) && (ctxt->myDoc != NULL) && 1076 (ctxt->myDoc->charset == XML_CHAR_ENCODING_NONE)) { 1077 ctxt->myDoc->charset = ctxt->charset; 1078 } 1079 } 1080 1081 #if defined(LIBXML_SAX1_ENABLED) || defined(LIBXML_HTML_ENABLED) || defined(LIBXML_WRITER_ENABLED) || defined(LIBXML_DOCB_ENABLED) 1082 /** 1083 * xmlSAX2AttributeInternal: 1084 * @ctx: the user data (XML parser context) 1085 * @fullname: The attribute name, including namespace prefix 1086 * @value: The attribute value 1087 * @prefix: the prefix on the element node 1088 * 1089 * Handle an attribute that has been read by the parser. 1090 * The default handling is to convert the attribute into an 1091 * DOM subtree and past it in a new xmlAttr element added to 1092 * the element. 1093 */ 1094 static void 1095 xmlSAX2AttributeInternal(void *ctx, const xmlChar *fullname, 1096 const xmlChar *value, const xmlChar *prefix ATTRIBUTE_UNUSED) 1097 { 1098 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; 1099 xmlAttrPtr ret; 1100 xmlChar *name; 1101 xmlChar *ns; 1102 xmlChar *nval; 1103 xmlNsPtr namespace; 1104 1105 if (ctxt->html) { 1106 name = xmlStrdup(fullname); 1107 ns = NULL; 1108 namespace = NULL; 1109 } else { 1110 /* 1111 * Split the full name into a namespace prefix and the tag name 1112 */ 1113 name = xmlSplitQName(ctxt, fullname, &ns); 1114 if ((name != NULL) && (name[0] == 0)) { 1115 if (xmlStrEqual(ns, BAD_CAST "xmlns")) { 1116 xmlNsErrMsg(ctxt, XML_ERR_NS_DECL_ERROR, 1117 "invalid namespace declaration '%s'\n", 1118 fullname, NULL); 1119 } else { 1120 xmlNsWarnMsg(ctxt, XML_WAR_NS_COLUMN, 1121 "Avoid attribute ending with ':' like '%s'\n", 1122 fullname, NULL); 1123 } 1124 if (ns != NULL) 1125 xmlFree(ns); 1126 ns = NULL; 1127 xmlFree(name); 1128 name = xmlStrdup(fullname); 1129 } 1130 } 1131 if (name == NULL) { 1132 xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElement"); 1133 if (ns != NULL) 1134 xmlFree(ns); 1135 return; 1136 } 1137 1138 #ifdef LIBXML_HTML_ENABLED 1139 if ((ctxt->html) && 1140 (value == NULL) && (htmlIsBooleanAttr(fullname))) { 1141 nval = xmlStrdup(fullname); 1142 value = (const xmlChar *) nval; 1143 } else 1144 #endif 1145 { 1146 #ifdef LIBXML_VALID_ENABLED 1147 /* 1148 * Do the last stage of the attribute normalization 1149 * Needed for HTML too: 1150 * http://www.w3.org/TR/html4/types.html#h-6.2 1151 */ 1152 ctxt->vctxt.valid = 1; 1153 nval = xmlValidCtxtNormalizeAttributeValue(&ctxt->vctxt, 1154 ctxt->myDoc, ctxt->node, 1155 fullname, value); 1156 if (ctxt->vctxt.valid != 1) { 1157 ctxt->valid = 0; 1158 } 1159 if (nval != NULL) 1160 value = nval; 1161 #else 1162 nval = NULL; 1163 #endif /* LIBXML_VALID_ENABLED */ 1164 } 1165 1166 /* 1167 * Check whether it's a namespace definition 1168 */ 1169 if ((!ctxt->html) && (ns == NULL) && 1170 (name[0] == 'x') && (name[1] == 'm') && (name[2] == 'l') && 1171 (name[3] == 'n') && (name[4] == 's') && (name[5] == 0)) { 1172 xmlNsPtr nsret; 1173 xmlChar *val; 1174 1175 if (!ctxt->replaceEntities) { 1176 ctxt->depth++; 1177 val = xmlStringDecodeEntities(ctxt, value, XML_SUBSTITUTE_REF, 1178 0,0,0); 1179 ctxt->depth--; 1180 } else { 1181 val = (xmlChar *) value; 1182 } 1183 1184 if (val[0] != 0) { 1185 xmlURIPtr uri; 1186 1187 uri = xmlParseURI((const char *)val); 1188 if (uri == NULL) { 1189 if ((ctxt->sax != NULL) && (ctxt->sax->warning != NULL)) 1190 ctxt->sax->warning(ctxt->userData, 1191 "xmlns: %s not a valid URI\n", val); 1192 } else { 1193 if (uri->scheme == NULL) { 1194 if ((ctxt->sax != NULL) && (ctxt->sax->warning != NULL)) 1195 ctxt->sax->warning(ctxt->userData, 1196 "xmlns: URI %s is not absolute\n", val); 1197 } 1198 xmlFreeURI(uri); 1199 } 1200 } 1201 1202 /* a default namespace definition */ 1203 nsret = xmlNewNs(ctxt->node, val, NULL); 1204 1205 #ifdef LIBXML_VALID_ENABLED 1206 /* 1207 * Validate also for namespace decls, they are attributes from 1208 * an XML-1.0 perspective 1209 */ 1210 if (nsret != NULL && ctxt->validate && ctxt->wellFormed && 1211 ctxt->myDoc && ctxt->myDoc->intSubset) 1212 ctxt->valid &= xmlValidateOneNamespace(&ctxt->vctxt, ctxt->myDoc, 1213 ctxt->node, prefix, nsret, val); 1214 #endif /* LIBXML_VALID_ENABLED */ 1215 if (name != NULL) 1216 xmlFree(name); 1217 if (nval != NULL) 1218 xmlFree(nval); 1219 if (val != value) 1220 xmlFree(val); 1221 return; 1222 } 1223 if ((!ctxt->html) && 1224 (ns != NULL) && (ns[0] == 'x') && (ns[1] == 'm') && (ns[2] == 'l') && 1225 (ns[3] == 'n') && (ns[4] == 's') && (ns[5] == 0)) { 1226 xmlNsPtr nsret; 1227 xmlChar *val; 1228 1229 if (!ctxt->replaceEntities) { 1230 ctxt->depth++; 1231 val = xmlStringDecodeEntities(ctxt, value, XML_SUBSTITUTE_REF, 1232 0,0,0); 1233 ctxt->depth--; 1234 if (val == NULL) { 1235 xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElement"); 1236 xmlFree(ns); 1237 if (name != NULL) 1238 xmlFree(name); 1239 return; 1240 } 1241 } else { 1242 val = (xmlChar *) value; 1243 } 1244 1245 if (val[0] == 0) { 1246 xmlNsErrMsg(ctxt, XML_NS_ERR_EMPTY, 1247 "Empty namespace name for prefix %s\n", name, NULL); 1248 } 1249 if ((ctxt->pedantic != 0) && (val[0] != 0)) { 1250 xmlURIPtr uri; 1251 1252 uri = xmlParseURI((const char *)val); 1253 if (uri == NULL) { 1254 xmlNsWarnMsg(ctxt, XML_WAR_NS_URI, 1255 "xmlns:%s: %s not a valid URI\n", name, value); 1256 } else { 1257 if (uri->scheme == NULL) { 1258 xmlNsWarnMsg(ctxt, XML_WAR_NS_URI_RELATIVE, 1259 "xmlns:%s: URI %s is not absolute\n", name, value); 1260 } 1261 xmlFreeURI(uri); 1262 } 1263 } 1264 1265 /* a standard namespace definition */ 1266 nsret = xmlNewNs(ctxt->node, val, name); 1267 xmlFree(ns); 1268 #ifdef LIBXML_VALID_ENABLED 1269 /* 1270 * Validate also for namespace decls, they are attributes from 1271 * an XML-1.0 perspective 1272 */ 1273 if (nsret != NULL && ctxt->validate && ctxt->wellFormed && 1274 ctxt->myDoc && ctxt->myDoc->intSubset) 1275 ctxt->valid &= xmlValidateOneNamespace(&ctxt->vctxt, ctxt->myDoc, 1276 ctxt->node, prefix, nsret, value); 1277 #endif /* LIBXML_VALID_ENABLED */ 1278 if (name != NULL) 1279 xmlFree(name); 1280 if (nval != NULL) 1281 xmlFree(nval); 1282 if (val != value) 1283 xmlFree(val); 1284 return; 1285 } 1286 1287 if (ns != NULL) { 1288 namespace = xmlSearchNs(ctxt->myDoc, ctxt->node, ns); 1289 1290 if (namespace == NULL) { 1291 xmlNsErrMsg(ctxt, XML_NS_ERR_UNDEFINED_NAMESPACE, 1292 "Namespace prefix %s of attribute %s is not defined\n", 1293 ns, name); 1294 } else { 1295 xmlAttrPtr prop; 1296 1297 prop = ctxt->node->properties; 1298 while (prop != NULL) { 1299 if (prop->ns != NULL) { 1300 if ((xmlStrEqual(name, prop->name)) && 1301 ((namespace == prop->ns) || 1302 (xmlStrEqual(namespace->href, prop->ns->href)))) { 1303 xmlNsErrMsg(ctxt, XML_ERR_ATTRIBUTE_REDEFINED, 1304 "Attribute %s in %s redefined\n", 1305 name, namespace->href); 1306 ctxt->wellFormed = 0; 1307 if (ctxt->recovery == 0) ctxt->disableSAX = 1; 1308 goto error; 1309 } 1310 } 1311 prop = prop->next; 1312 } 1313 } 1314 } else { 1315 namespace = NULL; 1316 } 1317 1318 /* !!!!!! <a toto:arg="" xmlns:toto="http://toto.com"> */ 1319 ret = xmlNewNsPropEatName(ctxt->node, namespace, name, NULL); 1320 1321 if (ret != NULL) { 1322 if ((ctxt->replaceEntities == 0) && (!ctxt->html)) { 1323 xmlNodePtr tmp; 1324 1325 ret->children = xmlStringGetNodeList(ctxt->myDoc, value); 1326 tmp = ret->children; 1327 while (tmp != NULL) { 1328 tmp->parent = (xmlNodePtr) ret; 1329 if (tmp->next == NULL) 1330 ret->last = tmp; 1331 tmp = tmp->next; 1332 } 1333 } else if (value != NULL) { 1334 ret->children = xmlNewDocText(ctxt->myDoc, value); 1335 ret->last = ret->children; 1336 if (ret->children != NULL) 1337 ret->children->parent = (xmlNodePtr) ret; 1338 } 1339 } 1340 1341 #ifdef LIBXML_VALID_ENABLED 1342 if ((!ctxt->html) && ctxt->validate && ctxt->wellFormed && 1343 ctxt->myDoc && ctxt->myDoc->intSubset) { 1344 1345 /* 1346 * If we don't substitute entities, the validation should be 1347 * done on a value with replaced entities anyway. 1348 */ 1349 if (!ctxt->replaceEntities) { 1350 xmlChar *val; 1351 1352 ctxt->depth++; 1353 val = xmlStringDecodeEntities(ctxt, value, XML_SUBSTITUTE_REF, 1354 0,0,0); 1355 ctxt->depth--; 1356 1357 if (val == NULL) 1358 ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt, 1359 ctxt->myDoc, ctxt->node, ret, value); 1360 else { 1361 xmlChar *nvalnorm; 1362 1363 /* 1364 * Do the last stage of the attribute normalization 1365 * It need to be done twice ... it's an extra burden related 1366 * to the ability to keep xmlSAX2References in attributes 1367 */ 1368 nvalnorm = xmlValidNormalizeAttributeValue(ctxt->myDoc, 1369 ctxt->node, fullname, val); 1370 if (nvalnorm != NULL) { 1371 xmlFree(val); 1372 val = nvalnorm; 1373 } 1374 1375 ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt, 1376 ctxt->myDoc, ctxt->node, ret, val); 1377 xmlFree(val); 1378 } 1379 } else { 1380 ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt, ctxt->myDoc, 1381 ctxt->node, ret, value); 1382 } 1383 } else 1384 #endif /* LIBXML_VALID_ENABLED */ 1385 if (((ctxt->loadsubset & XML_SKIP_IDS) == 0) && 1386 (((ctxt->replaceEntities == 0) && (ctxt->external != 2)) || 1387 ((ctxt->replaceEntities != 0) && (ctxt->inSubset == 0)))) { 1388 /* 1389 * when validating, the ID registration is done at the attribute 1390 * validation level. Otherwise we have to do specific handling here. 1391 */ 1392 if (xmlStrEqual(fullname, BAD_CAST "xml:id")) { 1393 /* 1394 * Add the xml:id value 1395 * 1396 * Open issue: normalization of the value. 1397 */ 1398 if (xmlValidateNCName(value, 1) != 0) { 1399 xmlErrValid(ctxt, XML_DTD_XMLID_VALUE, 1400 "xml:id : attribute value %s is not an NCName\n", 1401 (const char *) value, NULL); 1402 } 1403 xmlAddID(&ctxt->vctxt, ctxt->myDoc, value, ret); 1404 } else if (xmlIsID(ctxt->myDoc, ctxt->node, ret)) 1405 xmlAddID(&ctxt->vctxt, ctxt->myDoc, value, ret); 1406 else if (xmlIsRef(ctxt->myDoc, ctxt->node, ret)) 1407 xmlAddRef(&ctxt->vctxt, ctxt->myDoc, value, ret); 1408 } 1409 1410 error: 1411 if (nval != NULL) 1412 xmlFree(nval); 1413 if (ns != NULL) 1414 xmlFree(ns); 1415 } 1416 1417 /* 1418 * xmlCheckDefaultedAttributes: 1419 * 1420 * Check defaulted attributes from the DTD 1421 */ 1422 static void 1423 xmlCheckDefaultedAttributes(xmlParserCtxtPtr ctxt, const xmlChar *name, 1424 const xmlChar *prefix, const xmlChar **atts) { 1425 xmlElementPtr elemDecl; 1426 const xmlChar *att; 1427 int internal = 1; 1428 int i; 1429 1430 elemDecl = xmlGetDtdQElementDesc(ctxt->myDoc->intSubset, name, prefix); 1431 if (elemDecl == NULL) { 1432 elemDecl = xmlGetDtdQElementDesc(ctxt->myDoc->extSubset, name, prefix); 1433 internal = 0; 1434 } 1435 1436 process_external_subset: 1437 1438 if (elemDecl != NULL) { 1439 xmlAttributePtr attr = elemDecl->attributes; 1440 /* 1441 * Check against defaulted attributes from the external subset 1442 * if the document is stamped as standalone 1443 */ 1444 if ((ctxt->myDoc->standalone == 1) && 1445 (ctxt->myDoc->extSubset != NULL) && 1446 (ctxt->validate)) { 1447 while (attr != NULL) { 1448 if ((attr->defaultValue != NULL) && 1449 (xmlGetDtdQAttrDesc(ctxt->myDoc->extSubset, 1450 attr->elem, attr->name, 1451 attr->prefix) == attr) && 1452 (xmlGetDtdQAttrDesc(ctxt->myDoc->intSubset, 1453 attr->elem, attr->name, 1454 attr->prefix) == NULL)) { 1455 xmlChar *fulln; 1456 1457 if (attr->prefix != NULL) { 1458 fulln = xmlStrdup(attr->prefix); 1459 fulln = xmlStrcat(fulln, BAD_CAST ":"); 1460 fulln = xmlStrcat(fulln, attr->name); 1461 } else { 1462 fulln = xmlStrdup(attr->name); 1463 } 1464 if (fulln == NULL) { 1465 xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElement"); 1466 break; 1467 } 1468 1469 /* 1470 * Check that the attribute is not declared in the 1471 * serialization 1472 */ 1473 att = NULL; 1474 if (atts != NULL) { 1475 i = 0; 1476 att = atts[i]; 1477 while (att != NULL) { 1478 if (xmlStrEqual(att, fulln)) 1479 break; 1480 i += 2; 1481 att = atts[i]; 1482 } 1483 } 1484 if (att == NULL) { 1485 xmlErrValid(ctxt, XML_DTD_STANDALONE_DEFAULTED, 1486 "standalone: attribute %s on %s defaulted from external subset\n", 1487 (const char *)fulln, 1488 (const char *)attr->elem); 1489 } 1490 xmlFree(fulln); 1491 } 1492 attr = attr->nexth; 1493 } 1494 } 1495 1496 /* 1497 * Actually insert defaulted values when needed 1498 */ 1499 attr = elemDecl->attributes; 1500 while (attr != NULL) { 1501 /* 1502 * Make sure that attributes redefinition occuring in the 1503 * internal subset are not overriden by definitions in the 1504 * external subset. 1505 */ 1506 if (attr->defaultValue != NULL) { 1507 /* 1508 * the element should be instantiated in the tree if: 1509 * - this is a namespace prefix 1510 * - the user required for completion in the tree 1511 * like XSLT 1512 * - there isn't already an attribute definition 1513 * in the internal subset overriding it. 1514 */ 1515 if (((attr->prefix != NULL) && 1516 (xmlStrEqual(attr->prefix, BAD_CAST "xmlns"))) || 1517 ((attr->prefix == NULL) && 1518 (xmlStrEqual(attr->name, BAD_CAST "xmlns"))) || 1519 (ctxt->loadsubset & XML_COMPLETE_ATTRS)) { 1520 xmlAttributePtr tst; 1521 1522 tst = xmlGetDtdQAttrDesc(ctxt->myDoc->intSubset, 1523 attr->elem, attr->name, 1524 attr->prefix); 1525 if ((tst == attr) || (tst == NULL)) { 1526 xmlChar fn[50]; 1527 xmlChar *fulln; 1528 1529 fulln = xmlBuildQName(attr->name, attr->prefix, fn, 50); 1530 if (fulln == NULL) { 1531 xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElement"); 1532 return; 1533 } 1534 1535 /* 1536 * Check that the attribute is not declared in the 1537 * serialization 1538 */ 1539 att = NULL; 1540 if (atts != NULL) { 1541 i = 0; 1542 att = atts[i]; 1543 while (att != NULL) { 1544 if (xmlStrEqual(att, fulln)) 1545 break; 1546 i += 2; 1547 att = atts[i]; 1548 } 1549 } 1550 if (att == NULL) { 1551 xmlSAX2AttributeInternal(ctxt, fulln, 1552 attr->defaultValue, prefix); 1553 } 1554 if ((fulln != fn) && (fulln != attr->name)) 1555 xmlFree(fulln); 1556 } 1557 } 1558 } 1559 attr = attr->nexth; 1560 } 1561 if (internal == 1) { 1562 elemDecl = xmlGetDtdQElementDesc(ctxt->myDoc->extSubset, 1563 name, prefix); 1564 internal = 0; 1565 goto process_external_subset; 1566 } 1567 } 1568 } 1569 1570 /** 1571 * xmlSAX2StartElement: 1572 * @ctx: the user data (XML parser context) 1573 * @fullname: The element name, including namespace prefix 1574 * @atts: An array of name/value attributes pairs, NULL terminated 1575 * 1576 * called when an opening tag has been processed. 1577 */ 1578 void 1579 xmlSAX2StartElement(void *ctx, const xmlChar *fullname, const xmlChar **atts) 1580 { 1581 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; 1582 xmlNodePtr ret; 1583 xmlNodePtr parent; 1584 xmlNsPtr ns; 1585 xmlChar *name; 1586 xmlChar *prefix; 1587 const xmlChar *att; 1588 const xmlChar *value; 1589 int i; 1590 1591 if ((ctx == NULL) || (fullname == NULL) || (ctxt->myDoc == NULL)) return; 1592 parent = ctxt->node; 1593 #ifdef DEBUG_SAX 1594 xmlGenericError(xmlGenericErrorContext, 1595 "SAX.xmlSAX2StartElement(%s)\n", fullname); 1596 #endif 1597 1598 /* 1599 * First check on validity: 1600 */ 1601 if (ctxt->validate && (ctxt->myDoc->extSubset == NULL) && 1602 ((ctxt->myDoc->intSubset == NULL) || 1603 ((ctxt->myDoc->intSubset->notations == NULL) && 1604 (ctxt->myDoc->intSubset->elements == NULL) && 1605 (ctxt->myDoc->intSubset->attributes == NULL) && 1606 (ctxt->myDoc->intSubset->entities == NULL)))) { 1607 xmlErrValid(ctxt, XML_ERR_NO_DTD, 1608 "Validation failed: no DTD found !", NULL, NULL); 1609 ctxt->validate = 0; 1610 } 1611 1612 1613 /* 1614 * Split the full name into a namespace prefix and the tag name 1615 */ 1616 name = xmlSplitQName(ctxt, fullname, &prefix); 1617 1618 1619 /* 1620 * Note : the namespace resolution is deferred until the end of the 1621 * attributes parsing, since local namespace can be defined as 1622 * an attribute at this level. 1623 */ 1624 ret = xmlNewDocNodeEatName(ctxt->myDoc, NULL, name, NULL); 1625 if (ret == NULL) { 1626 if (prefix != NULL) 1627 xmlFree(prefix); 1628 xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElement"); 1629 return; 1630 } 1631 if (ctxt->myDoc->children == NULL) { 1632 #ifdef DEBUG_SAX_TREE 1633 xmlGenericError(xmlGenericErrorContext, "Setting %s as root\n", name); 1634 #endif 1635 xmlAddChild((xmlNodePtr) ctxt->myDoc, (xmlNodePtr) ret); 1636 } else if (parent == NULL) { 1637 parent = ctxt->myDoc->children; 1638 } 1639 ctxt->nodemem = -1; 1640 if (ctxt->linenumbers) { 1641 if (ctxt->input != NULL) { 1642 if (ctxt->input->line < 65535) 1643 ret->line = (short) ctxt->input->line; 1644 else 1645 ret->line = 65535; 1646 } 1647 } 1648 1649 /* 1650 * We are parsing a new node. 1651 */ 1652 #ifdef DEBUG_SAX_TREE 1653 xmlGenericError(xmlGenericErrorContext, "pushing(%s)\n", name); 1654 #endif 1655 nodePush(ctxt, ret); 1656 1657 /* 1658 * Link the child element 1659 */ 1660 if (parent != NULL) { 1661 if (parent->type == XML_ELEMENT_NODE) { 1662 #ifdef DEBUG_SAX_TREE 1663 xmlGenericError(xmlGenericErrorContext, 1664 "adding child %s to %s\n", name, parent->name); 1665 #endif 1666 xmlAddChild(parent, ret); 1667 } else { 1668 #ifdef DEBUG_SAX_TREE 1669 xmlGenericError(xmlGenericErrorContext, 1670 "adding sibling %s to ", name); 1671 xmlDebugDumpOneNode(stderr, parent, 0); 1672 #endif 1673 xmlAddSibling(parent, ret); 1674 } 1675 } 1676 1677 /* 1678 * Insert all the defaulted attributes from the DTD especially namespaces 1679 */ 1680 if ((!ctxt->html) && 1681 ((ctxt->myDoc->intSubset != NULL) || 1682 (ctxt->myDoc->extSubset != NULL))) { 1683 xmlCheckDefaultedAttributes(ctxt, name, prefix, atts); 1684 } 1685 1686 /* 1687 * process all the attributes whose name start with "xmlns" 1688 */ 1689 if (atts != NULL) { 1690 i = 0; 1691 att = atts[i++]; 1692 value = atts[i++]; 1693 if (!ctxt->html) { 1694 while ((att != NULL) && (value != NULL)) { 1695 if ((att[0] == 'x') && (att[1] == 'm') && (att[2] == 'l') && 1696 (att[3] == 'n') && (att[4] == 's')) 1697 xmlSAX2AttributeInternal(ctxt, att, value, prefix); 1698 1699 att = atts[i++]; 1700 value = atts[i++]; 1701 } 1702 } 1703 } 1704 1705 /* 1706 * Search the namespace, note that since the attributes have been 1707 * processed, the local namespaces are available. 1708 */ 1709 ns = xmlSearchNs(ctxt->myDoc, ret, prefix); 1710 if ((ns == NULL) && (parent != NULL)) 1711 ns = xmlSearchNs(ctxt->myDoc, parent, prefix); 1712 if ((prefix != NULL) && (ns == NULL)) { 1713 ns = xmlNewNs(ret, NULL, prefix); 1714 xmlNsWarnMsg(ctxt, XML_NS_ERR_UNDEFINED_NAMESPACE, 1715 "Namespace prefix %s is not defined\n", 1716 prefix, NULL); 1717 } 1718 1719 /* 1720 * set the namespace node, making sure that if the default namspace 1721 * is unbound on a parent we simply kee it NULL 1722 */ 1723 if ((ns != NULL) && (ns->href != NULL) && 1724 ((ns->href[0] != 0) || (ns->prefix != NULL))) 1725 xmlSetNs(ret, ns); 1726 1727 /* 1728 * process all the other attributes 1729 */ 1730 if (atts != NULL) { 1731 i = 0; 1732 att = atts[i++]; 1733 value = atts[i++]; 1734 if (ctxt->html) { 1735 while (att != NULL) { 1736 xmlSAX2AttributeInternal(ctxt, att, value, NULL); 1737 att = atts[i++]; 1738 value = atts[i++]; 1739 } 1740 } else { 1741 while ((att != NULL) && (value != NULL)) { 1742 if ((att[0] != 'x') || (att[1] != 'm') || (att[2] != 'l') || 1743 (att[3] != 'n') || (att[4] != 's')) 1744 xmlSAX2AttributeInternal(ctxt, att, value, NULL); 1745 1746 /* 1747 * Next ones 1748 */ 1749 att = atts[i++]; 1750 value = atts[i++]; 1751 } 1752 } 1753 } 1754 1755 #ifdef LIBXML_VALID_ENABLED 1756 /* 1757 * If it's the Document root, finish the DTD validation and 1758 * check the document root element for validity 1759 */ 1760 if ((ctxt->validate) && (ctxt->vctxt.finishDtd == XML_CTXT_FINISH_DTD_0)) { 1761 int chk; 1762 1763 chk = xmlValidateDtdFinal(&ctxt->vctxt, ctxt->myDoc); 1764 if (chk <= 0) 1765 ctxt->valid = 0; 1766 if (chk < 0) 1767 ctxt->wellFormed = 0; 1768 ctxt->valid &= xmlValidateRoot(&ctxt->vctxt, ctxt->myDoc); 1769 ctxt->vctxt.finishDtd = XML_CTXT_FINISH_DTD_1; 1770 } 1771 #endif /* LIBXML_VALID_ENABLED */ 1772 1773 if (prefix != NULL) 1774 xmlFree(prefix); 1775 1776 } 1777 1778 /** 1779 * xmlSAX2EndElement: 1780 * @ctx: the user data (XML parser context) 1781 * @name: The element name 1782 * 1783 * called when the end of an element has been detected. 1784 */ 1785 void 1786 xmlSAX2EndElement(void *ctx, const xmlChar *name ATTRIBUTE_UNUSED) 1787 { 1788 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; 1789 xmlNodePtr cur; 1790 1791 if (ctx == NULL) return; 1792 cur = ctxt->node; 1793 #ifdef DEBUG_SAX 1794 if (name == NULL) 1795 xmlGenericError(xmlGenericErrorContext, "SAX.xmlSAX2EndElement(NULL)\n"); 1796 else 1797 xmlGenericError(xmlGenericErrorContext, "SAX.xmlSAX2EndElement(%s)\n", name); 1798 #endif 1799 1800 /* Capture end position and add node */ 1801 if (cur != NULL && ctxt->record_info) { 1802 ctxt->nodeInfo->end_pos = ctxt->input->cur - ctxt->input->base; 1803 ctxt->nodeInfo->end_line = ctxt->input->line; 1804 ctxt->nodeInfo->node = cur; 1805 xmlParserAddNodeInfo(ctxt, ctxt->nodeInfo); 1806 } 1807 ctxt->nodemem = -1; 1808 1809 #ifdef LIBXML_VALID_ENABLED 1810 if (ctxt->validate && ctxt->wellFormed && 1811 ctxt->myDoc && ctxt->myDoc->intSubset) 1812 ctxt->valid &= xmlValidateOneElement(&ctxt->vctxt, ctxt->myDoc, 1813 cur); 1814 #endif /* LIBXML_VALID_ENABLED */ 1815 1816 1817 /* 1818 * end of parsing of this node. 1819 */ 1820 #ifdef DEBUG_SAX_TREE 1821 xmlGenericError(xmlGenericErrorContext, "popping(%s)\n", cur->name); 1822 #endif 1823 nodePop(ctxt); 1824 } 1825 #endif /* LIBXML_SAX1_ENABLED || LIBXML_HTML_ENABLE */ 1826 1827 /* 1828 * xmlSAX2TextNode: 1829 * @ctxt: the parser context 1830 * @str: the input string 1831 * @len: the string length 1832 * 1833 * Callback for a text node 1834 * 1835 * Returns the newly allocated string or NULL if not needed or error 1836 */ 1837 static xmlNodePtr 1838 xmlSAX2TextNode(xmlParserCtxtPtr ctxt, const xmlChar *str, int len) { 1839 xmlNodePtr ret; 1840 const xmlChar *intern = NULL; 1841 1842 /* 1843 * Allocate 1844 */ 1845 if (ctxt->freeElems != NULL) { 1846 ret = ctxt->freeElems; 1847 ctxt->freeElems = ret->next; 1848 ctxt->freeElemsNr--; 1849 } else { 1850 ret = (xmlNodePtr) xmlMalloc(sizeof(xmlNode)); 1851 } 1852 if (ret == NULL) { 1853 xmlErrMemory(ctxt, "xmlSAX2Characters"); 1854 return(NULL); 1855 } 1856 memset(ret, 0, sizeof(xmlNode)); 1857 /* 1858 * intern the formatting blanks found between tags, or the 1859 * very short strings 1860 */ 1861 if (ctxt->dictNames) { 1862 xmlChar cur = str[len]; 1863 1864 if ((len < (int) (2 * sizeof(void *))) && 1865 (ctxt->options & XML_PARSE_COMPACT)) { 1866 /* store the string in the node overriding properties and nsDef */ 1867 xmlChar *tmp = (xmlChar *) &(ret->properties); 1868 memcpy(tmp, str, len); 1869 tmp[len] = 0; 1870 intern = tmp; 1871 } else if ((len <= 3) && ((cur == '"') || (cur == '\'') || 1872 ((cur == '<') && (str[len + 1] != '!')))) { 1873 intern = xmlDictLookup(ctxt->dict, str, len); 1874 } else if (IS_BLANK_CH(*str) && (len < 60) && (cur == '<') && 1875 (str[len + 1] != '!')) { 1876 int i; 1877 1878 for (i = 1;i < len;i++) { 1879 if (!IS_BLANK_CH(str[i])) goto skip; 1880 } 1881 intern = xmlDictLookup(ctxt->dict, str, len); 1882 } 1883 } 1884 skip: 1885 ret->type = XML_TEXT_NODE; 1886 1887 ret->name = xmlStringText; 1888 if (intern == NULL) { 1889 ret->content = xmlStrndup(str, len); 1890 if (ret->content == NULL) { 1891 xmlSAX2ErrMemory(ctxt, "xmlSAX2TextNode"); 1892 xmlFree(ret); 1893 return(NULL); 1894 } 1895 } else 1896 ret->content = (xmlChar *) intern; 1897 1898 if (ctxt->linenumbers) { 1899 if (ctxt->input != NULL) { 1900 if (ctxt->input->line < 65535) 1901 ret->line = (short) ctxt->input->line; 1902 else { 1903 ret->line = 65535; 1904 if (ctxt->options & XML_PARSE_BIG_LINES) 1905 ret->psvi = (void *) (long) ctxt->input->line; 1906 } 1907 } 1908 } 1909 1910 if ((__xmlRegisterCallbacks) && (xmlRegisterNodeDefaultValue)) 1911 xmlRegisterNodeDefaultValue(ret); 1912 return(ret); 1913 } 1914 1915 #ifdef LIBXML_VALID_ENABLED 1916 /* 1917 * xmlSAX2DecodeAttrEntities: 1918 * @ctxt: the parser context 1919 * @str: the input string 1920 * @len: the string length 1921 * 1922 * Remove the entities from an attribute value 1923 * 1924 * Returns the newly allocated string or NULL if not needed or error 1925 */ 1926 static xmlChar * 1927 xmlSAX2DecodeAttrEntities(xmlParserCtxtPtr ctxt, const xmlChar *str, 1928 const xmlChar *end) { 1929 const xmlChar *in; 1930 xmlChar *ret; 1931 1932 in = str; 1933 while (in < end) 1934 if (*in++ == '&') 1935 goto decode; 1936 return(NULL); 1937 decode: 1938 ctxt->depth++; 1939 ret = xmlStringLenDecodeEntities(ctxt, str, end - str, 1940 XML_SUBSTITUTE_REF, 0,0,0); 1941 ctxt->depth--; 1942 return(ret); 1943 } 1944 #endif /* LIBXML_VALID_ENABLED */ 1945 1946 /** 1947 * xmlSAX2AttributeNs: 1948 * @ctx: the user data (XML parser context) 1949 * @localname: the local name of the attribute 1950 * @prefix: the attribute namespace prefix if available 1951 * @URI: the attribute namespace name if available 1952 * @value: Start of the attribute value 1953 * @valueend: end of the attribute value 1954 * 1955 * Handle an attribute that has been read by the parser. 1956 * The default handling is to convert the attribute into an 1957 * DOM subtree and past it in a new xmlAttr element added to 1958 * the element. 1959 */ 1960 static void 1961 xmlSAX2AttributeNs(xmlParserCtxtPtr ctxt, 1962 const xmlChar * localname, 1963 const xmlChar * prefix, 1964 const xmlChar * value, 1965 const xmlChar * valueend) 1966 { 1967 xmlAttrPtr ret; 1968 xmlNsPtr namespace = NULL; 1969 xmlChar *dup = NULL; 1970 1971 /* 1972 * Note: if prefix == NULL, the attribute is not in the default namespace 1973 */ 1974 if (prefix != NULL) 1975 namespace = xmlSearchNs(ctxt->myDoc, ctxt->node, prefix); 1976 1977 /* 1978 * allocate the node 1979 */ 1980 if (ctxt->freeAttrs != NULL) { 1981 ret = ctxt->freeAttrs; 1982 ctxt->freeAttrs = ret->next; 1983 ctxt->freeAttrsNr--; 1984 memset(ret, 0, sizeof(xmlAttr)); 1985 ret->type = XML_ATTRIBUTE_NODE; 1986 1987 ret->parent = ctxt->node; 1988 ret->doc = ctxt->myDoc; 1989 ret->ns = namespace; 1990 1991 if (ctxt->dictNames) 1992 ret->name = localname; 1993 else 1994 ret->name = xmlStrdup(localname); 1995 1996 /* link at the end to preserv order, TODO speed up with a last */ 1997 if (ctxt->node->properties == NULL) { 1998 ctxt->node->properties = ret; 1999 } else { 2000 xmlAttrPtr prev = ctxt->node->properties; 2001 2002 while (prev->next != NULL) prev = prev->next; 2003 prev->next = ret; 2004 ret->prev = prev; 2005 } 2006 2007 if ((__xmlRegisterCallbacks) && (xmlRegisterNodeDefaultValue)) 2008 xmlRegisterNodeDefaultValue((xmlNodePtr)ret); 2009 } else { 2010 if (ctxt->dictNames) 2011 ret = xmlNewNsPropEatName(ctxt->node, namespace, 2012 (xmlChar *) localname, NULL); 2013 else 2014 ret = xmlNewNsProp(ctxt->node, namespace, localname, NULL); 2015 if (ret == NULL) { 2016 xmlErrMemory(ctxt, "xmlSAX2AttributeNs"); 2017 return; 2018 } 2019 } 2020 2021 if ((ctxt->replaceEntities == 0) && (!ctxt->html)) { 2022 xmlNodePtr tmp; 2023 2024 /* 2025 * We know that if there is an entity reference, then 2026 * the string has been dup'ed and terminates with 0 2027 * otherwise with ' or " 2028 */ 2029 if (*valueend != 0) { 2030 tmp = xmlSAX2TextNode(ctxt, value, valueend - value); 2031 ret->children = tmp; 2032 ret->last = tmp; 2033 if (tmp != NULL) { 2034 tmp->doc = ret->doc; 2035 tmp->parent = (xmlNodePtr) ret; 2036 } 2037 } else { 2038 ret->children = xmlStringLenGetNodeList(ctxt->myDoc, value, 2039 valueend - value); 2040 tmp = ret->children; 2041 while (tmp != NULL) { 2042 tmp->doc = ret->doc; 2043 tmp->parent = (xmlNodePtr) ret; 2044 if (tmp->next == NULL) 2045 ret->last = tmp; 2046 tmp = tmp->next; 2047 } 2048 } 2049 } else if (value != NULL) { 2050 xmlNodePtr tmp; 2051 2052 tmp = xmlSAX2TextNode(ctxt, value, valueend - value); 2053 ret->children = tmp; 2054 ret->last = tmp; 2055 if (tmp != NULL) { 2056 tmp->doc = ret->doc; 2057 tmp->parent = (xmlNodePtr) ret; 2058 } 2059 } 2060 2061 #ifdef LIBXML_VALID_ENABLED 2062 if ((!ctxt->html) && ctxt->validate && ctxt->wellFormed && 2063 ctxt->myDoc && ctxt->myDoc->intSubset) { 2064 /* 2065 * If we don't substitute entities, the validation should be 2066 * done on a value with replaced entities anyway. 2067 */ 2068 if (!ctxt->replaceEntities) { 2069 dup = xmlSAX2DecodeAttrEntities(ctxt, value, valueend); 2070 if (dup == NULL) { 2071 if (*valueend == 0) { 2072 ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt, 2073 ctxt->myDoc, ctxt->node, ret, value); 2074 } else { 2075 /* 2076 * That should already be normalized. 2077 * cheaper to finally allocate here than duplicate 2078 * entry points in the full validation code 2079 */ 2080 dup = xmlStrndup(value, valueend - value); 2081 2082 ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt, 2083 ctxt->myDoc, ctxt->node, ret, dup); 2084 } 2085 } else { 2086 /* 2087 * dup now contains a string of the flattened attribute 2088 * content with entities substitued. Check if we need to 2089 * apply an extra layer of normalization. 2090 * It need to be done twice ... it's an extra burden related 2091 * to the ability to keep references in attributes 2092 */ 2093 if (ctxt->attsSpecial != NULL) { 2094 xmlChar *nvalnorm; 2095 xmlChar fn[50]; 2096 xmlChar *fullname; 2097 2098 fullname = xmlBuildQName(localname, prefix, fn, 50); 2099 if (fullname != NULL) { 2100 ctxt->vctxt.valid = 1; 2101 nvalnorm = xmlValidCtxtNormalizeAttributeValue( 2102 &ctxt->vctxt, ctxt->myDoc, 2103 ctxt->node, fullname, dup); 2104 if (ctxt->vctxt.valid != 1) 2105 ctxt->valid = 0; 2106 2107 if ((fullname != fn) && (fullname != localname)) 2108 xmlFree(fullname); 2109 if (nvalnorm != NULL) { 2110 xmlFree(dup); 2111 dup = nvalnorm; 2112 } 2113 } 2114 } 2115 2116 ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt, 2117 ctxt->myDoc, ctxt->node, ret, dup); 2118 } 2119 } else { 2120 /* 2121 * if entities already have been substitued, then 2122 * the attribute as passed is already normalized 2123 */ 2124 dup = xmlStrndup(value, valueend - value); 2125 2126 ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt, 2127 ctxt->myDoc, ctxt->node, ret, dup); 2128 } 2129 } else 2130 #endif /* LIBXML_VALID_ENABLED */ 2131 if (((ctxt->loadsubset & XML_SKIP_IDS) == 0) && 2132 (((ctxt->replaceEntities == 0) && (ctxt->external != 2)) || 2133 ((ctxt->replaceEntities != 0) && (ctxt->inSubset == 0)))) { 2134 /* 2135 * when validating, the ID registration is done at the attribute 2136 * validation level. Otherwise we have to do specific handling here. 2137 */ 2138 if ((prefix == ctxt->str_xml) && 2139 (localname[0] == 'i') && (localname[1] == 'd') && 2140 (localname[2] == 0)) { 2141 /* 2142 * Add the xml:id value 2143 * 2144 * Open issue: normalization of the value. 2145 */ 2146 if (dup == NULL) 2147 dup = xmlStrndup(value, valueend - value); 2148 #ifdef LIBXML_VALID_ENABLED 2149 if (xmlValidateNCName(dup, 1) != 0) { 2150 xmlErrValid(ctxt, XML_DTD_XMLID_VALUE, 2151 "xml:id : attribute value %s is not an NCName\n", 2152 (const char *) dup, NULL); 2153 } 2154 #endif 2155 xmlAddID(&ctxt->vctxt, ctxt->myDoc, dup, ret); 2156 } else if (xmlIsID(ctxt->myDoc, ctxt->node, ret)) { 2157 /* might be worth duplicate entry points and not copy */ 2158 if (dup == NULL) 2159 dup = xmlStrndup(value, valueend - value); 2160 xmlAddID(&ctxt->vctxt, ctxt->myDoc, dup, ret); 2161 } else if (xmlIsRef(ctxt->myDoc, ctxt->node, ret)) { 2162 if (dup == NULL) 2163 dup = xmlStrndup(value, valueend - value); 2164 xmlAddRef(&ctxt->vctxt, ctxt->myDoc, dup, ret); 2165 } 2166 } 2167 if (dup != NULL) 2168 xmlFree(dup); 2169 } 2170 2171 /** 2172 * xmlSAX2StartElementNs: 2173 * @ctx: the user data (XML parser context) 2174 * @localname: the local name of the element 2175 * @prefix: the element namespace prefix if available 2176 * @URI: the element namespace name if available 2177 * @nb_namespaces: number of namespace definitions on that node 2178 * @namespaces: pointer to the array of prefix/URI pairs namespace definitions 2179 * @nb_attributes: the number of attributes on that node 2180 * @nb_defaulted: the number of defaulted attributes. 2181 * @attributes: pointer to the array of (localname/prefix/URI/value/end) 2182 * attribute values. 2183 * 2184 * SAX2 callback when an element start has been detected by the parser. 2185 * It provides the namespace informations for the element, as well as 2186 * the new namespace declarations on the element. 2187 */ 2188 void 2189 xmlSAX2StartElementNs(void *ctx, 2190 const xmlChar *localname, 2191 const xmlChar *prefix, 2192 const xmlChar *URI, 2193 int nb_namespaces, 2194 const xmlChar **namespaces, 2195 int nb_attributes, 2196 int nb_defaulted, 2197 const xmlChar **attributes) 2198 { 2199 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; 2200 xmlNodePtr ret; 2201 xmlNodePtr parent; 2202 xmlNsPtr last = NULL, ns; 2203 const xmlChar *uri, *pref; 2204 xmlChar *lname = NULL; 2205 int i, j; 2206 2207 if (ctx == NULL) return; 2208 parent = ctxt->node; 2209 /* 2210 * First check on validity: 2211 */ 2212 if (ctxt->validate && (ctxt->myDoc->extSubset == NULL) && 2213 ((ctxt->myDoc->intSubset == NULL) || 2214 ((ctxt->myDoc->intSubset->notations == NULL) && 2215 (ctxt->myDoc->intSubset->elements == NULL) && 2216 (ctxt->myDoc->intSubset->attributes == NULL) && 2217 (ctxt->myDoc->intSubset->entities == NULL)))) { 2218 xmlErrValid(ctxt, XML_DTD_NO_DTD, 2219 "Validation failed: no DTD found !", NULL, NULL); 2220 ctxt->validate = 0; 2221 } 2222 2223 /* 2224 * Take care of the rare case of an undefined namespace prefix 2225 */ 2226 if ((prefix != NULL) && (URI == NULL)) { 2227 if (ctxt->dictNames) { 2228 const xmlChar *fullname; 2229 2230 fullname = xmlDictQLookup(ctxt->dict, prefix, localname); 2231 if (fullname != NULL) 2232 localname = fullname; 2233 } else { 2234 lname = xmlBuildQName(localname, prefix, NULL, 0); 2235 } 2236 } 2237 /* 2238 * allocate the node 2239 */ 2240 if (ctxt->freeElems != NULL) { 2241 ret = ctxt->freeElems; 2242 ctxt->freeElems = ret->next; 2243 ctxt->freeElemsNr--; 2244 memset(ret, 0, sizeof(xmlNode)); 2245 ret->type = XML_ELEMENT_NODE; 2246 2247 if (ctxt->dictNames) 2248 ret->name = localname; 2249 else { 2250 if (lname == NULL) 2251 ret->name = xmlStrdup(localname); 2252 else 2253 ret->name = lname; 2254 if (ret->name == NULL) { 2255 xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElementNs"); 2256 return; 2257 } 2258 } 2259 if ((__xmlRegisterCallbacks) && (xmlRegisterNodeDefaultValue)) 2260 xmlRegisterNodeDefaultValue(ret); 2261 } else { 2262 if (ctxt->dictNames) 2263 ret = xmlNewDocNodeEatName(ctxt->myDoc, NULL, 2264 (xmlChar *) localname, NULL); 2265 else if (lname == NULL) 2266 ret = xmlNewDocNode(ctxt->myDoc, NULL, localname, NULL); 2267 else 2268 ret = xmlNewDocNodeEatName(ctxt->myDoc, NULL, 2269 (xmlChar *) lname, NULL); 2270 if (ret == NULL) { 2271 xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElementNs"); 2272 return; 2273 } 2274 } 2275 if (ctxt->linenumbers) { 2276 if (ctxt->input != NULL) { 2277 if (ctxt->input->line < 65535) 2278 ret->line = (short) ctxt->input->line; 2279 else 2280 ret->line = 65535; 2281 } 2282 } 2283 2284 if (parent == NULL) { 2285 xmlAddChild((xmlNodePtr) ctxt->myDoc, (xmlNodePtr) ret); 2286 } 2287 /* 2288 * Build the namespace list 2289 */ 2290 for (i = 0,j = 0;j < nb_namespaces;j++) { 2291 pref = namespaces[i++]; 2292 uri = namespaces[i++]; 2293 ns = xmlNewNs(NULL, uri, pref); 2294 if (ns != NULL) { 2295 if (last == NULL) { 2296 ret->nsDef = last = ns; 2297 } else { 2298 last->next = ns; 2299 last = ns; 2300 } 2301 if ((URI != NULL) && (prefix == pref)) 2302 ret->ns = ns; 2303 } else { 2304 /* 2305 * any out of memory error would already have been raised 2306 * but we can't be garanteed it's the actual error due to the 2307 * API, best is to skip in this case 2308 */ 2309 continue; 2310 } 2311 #ifdef LIBXML_VALID_ENABLED 2312 if ((!ctxt->html) && ctxt->validate && ctxt->wellFormed && 2313 ctxt->myDoc && ctxt->myDoc->intSubset) { 2314 ctxt->valid &= xmlValidateOneNamespace(&ctxt->vctxt, ctxt->myDoc, 2315 ret, prefix, ns, uri); 2316 } 2317 #endif /* LIBXML_VALID_ENABLED */ 2318 } 2319 ctxt->nodemem = -1; 2320 2321 /* 2322 * We are parsing a new node. 2323 */ 2324 nodePush(ctxt, ret); 2325 2326 /* 2327 * Link the child element 2328 */ 2329 if (parent != NULL) { 2330 if (parent->type == XML_ELEMENT_NODE) { 2331 xmlAddChild(parent, ret); 2332 } else { 2333 xmlAddSibling(parent, ret); 2334 } 2335 } 2336 2337 /* 2338 * Insert the defaulted attributes from the DTD only if requested: 2339 */ 2340 if ((nb_defaulted != 0) && 2341 ((ctxt->loadsubset & XML_COMPLETE_ATTRS) == 0)) 2342 nb_attributes -= nb_defaulted; 2343 2344 /* 2345 * Search the namespace if it wasn't already found 2346 * Note that, if prefix is NULL, this searches for the default Ns 2347 */ 2348 if ((URI != NULL) && (ret->ns == NULL)) { 2349 ret->ns = xmlSearchNs(ctxt->myDoc, parent, prefix); 2350 if ((ret->ns == NULL) && (xmlStrEqual(prefix, BAD_CAST "xml"))) { 2351 ret->ns = xmlSearchNs(ctxt->myDoc, ret, prefix); 2352 } 2353 if (ret->ns == NULL) { 2354 ns = xmlNewNs(ret, NULL, prefix); 2355 if (ns == NULL) { 2356 2357 xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElementNs"); 2358 return; 2359 } 2360 if (prefix != NULL) 2361 xmlNsWarnMsg(ctxt, XML_NS_ERR_UNDEFINED_NAMESPACE, 2362 "Namespace prefix %s was not found\n", 2363 prefix, NULL); 2364 else 2365 xmlNsWarnMsg(ctxt, XML_NS_ERR_UNDEFINED_NAMESPACE, 2366 "Namespace default prefix was not found\n", 2367 NULL, NULL); 2368 } 2369 } 2370 2371 /* 2372 * process all the other attributes 2373 */ 2374 if (nb_attributes > 0) { 2375 for (j = 0,i = 0;i < nb_attributes;i++,j+=5) { 2376 /* 2377 * Handle the rare case of an undefined atribute prefix 2378 */ 2379 if ((attributes[j+1] != NULL) && (attributes[j+2] == NULL)) { 2380 if (ctxt->dictNames) { 2381 const xmlChar *fullname; 2382 2383 fullname = xmlDictQLookup(ctxt->dict, attributes[j+1], 2384 attributes[j]); 2385 if (fullname != NULL) { 2386 xmlSAX2AttributeNs(ctxt, fullname, NULL, 2387 attributes[j+3], attributes[j+4]); 2388 continue; 2389 } 2390 } else { 2391 lname = xmlBuildQName(attributes[j], attributes[j+1], 2392 NULL, 0); 2393 if (lname != NULL) { 2394 xmlSAX2AttributeNs(ctxt, lname, NULL, 2395 attributes[j+3], attributes[j+4]); 2396 xmlFree(lname); 2397 continue; 2398 } 2399 } 2400 } 2401 xmlSAX2AttributeNs(ctxt, attributes[j], attributes[j+1], 2402 attributes[j+3], attributes[j+4]); 2403 } 2404 } 2405 2406 #ifdef LIBXML_VALID_ENABLED 2407 /* 2408 * If it's the Document root, finish the DTD validation and 2409 * check the document root element for validity 2410 */ 2411 if ((ctxt->validate) && (ctxt->vctxt.finishDtd == XML_CTXT_FINISH_DTD_0)) { 2412 int chk; 2413 2414 chk = xmlValidateDtdFinal(&ctxt->vctxt, ctxt->myDoc); 2415 if (chk <= 0) 2416 ctxt->valid = 0; 2417 if (chk < 0) 2418 ctxt->wellFormed = 0; 2419 ctxt->valid &= xmlValidateRoot(&ctxt->vctxt, ctxt->myDoc); 2420 ctxt->vctxt.finishDtd = XML_CTXT_FINISH_DTD_1; 2421 } 2422 #endif /* LIBXML_VALID_ENABLED */ 2423 } 2424 2425 /** 2426 * xmlSAX2EndElementNs: 2427 * @ctx: the user data (XML parser context) 2428 * @localname: the local name of the element 2429 * @prefix: the element namespace prefix if available 2430 * @URI: the element namespace name if available 2431 * 2432 * SAX2 callback when an element end has been detected by the parser. 2433 * It provides the namespace informations for the element. 2434 */ 2435 void 2436 xmlSAX2EndElementNs(void *ctx, 2437 const xmlChar * localname ATTRIBUTE_UNUSED, 2438 const xmlChar * prefix ATTRIBUTE_UNUSED, 2439 const xmlChar * URI ATTRIBUTE_UNUSED) 2440 { 2441 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; 2442 xmlParserNodeInfo node_info; 2443 xmlNodePtr cur; 2444 2445 if (ctx == NULL) return; 2446 cur = ctxt->node; 2447 /* Capture end position and add node */ 2448 if ((ctxt->record_info) && (cur != NULL)) { 2449 node_info.end_pos = ctxt->input->cur - ctxt->input->base; 2450 node_info.end_line = ctxt->input->line; 2451 node_info.node = cur; 2452 xmlParserAddNodeInfo(ctxt, &node_info); 2453 } 2454 ctxt->nodemem = -1; 2455 2456 #ifdef LIBXML_VALID_ENABLED 2457 if (ctxt->validate && ctxt->wellFormed && 2458 ctxt->myDoc && ctxt->myDoc->intSubset) 2459 ctxt->valid &= xmlValidateOneElement(&ctxt->vctxt, ctxt->myDoc, cur); 2460 #endif /* LIBXML_VALID_ENABLED */ 2461 2462 /* 2463 * end of parsing of this node. 2464 */ 2465 nodePop(ctxt); 2466 } 2467 2468 /** 2469 * xmlSAX2Reference: 2470 * @ctx: the user data (XML parser context) 2471 * @name: The entity name 2472 * 2473 * called when an entity xmlSAX2Reference is detected. 2474 */ 2475 void 2476 xmlSAX2Reference(void *ctx, const xmlChar *name) 2477 { 2478 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; 2479 xmlNodePtr ret; 2480 2481 if (ctx == NULL) return; 2482 #ifdef DEBUG_SAX 2483 xmlGenericError(xmlGenericErrorContext, 2484 "SAX.xmlSAX2Reference(%s)\n", name); 2485 #endif 2486 if (name[0] == '#') 2487 ret = xmlNewCharRef(ctxt->myDoc, name); 2488 else 2489 ret = xmlNewReference(ctxt->myDoc, name); 2490 #ifdef DEBUG_SAX_TREE 2491 xmlGenericError(xmlGenericErrorContext, 2492 "add xmlSAX2Reference %s to %s \n", name, ctxt->node->name); 2493 #endif 2494 if (xmlAddChild(ctxt->node, ret) == NULL) { 2495 xmlFreeNode(ret); 2496 } 2497 } 2498 2499 /** 2500 * xmlSAX2Characters: 2501 * @ctx: the user data (XML parser context) 2502 * @ch: a xmlChar string 2503 * @len: the number of xmlChar 2504 * 2505 * receiving some chars from the parser. 2506 */ 2507 void 2508 xmlSAX2Characters(void *ctx, const xmlChar *ch, int len) 2509 { 2510 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; 2511 xmlNodePtr lastChild; 2512 2513 if (ctx == NULL) return; 2514 #ifdef DEBUG_SAX 2515 xmlGenericError(xmlGenericErrorContext, 2516 "SAX.xmlSAX2Characters(%.30s, %d)\n", ch, len); 2517 #endif 2518 /* 2519 * Handle the data if any. If there is no child 2520 * add it as content, otherwise if the last child is text, 2521 * concatenate it, else create a new node of type text. 2522 */ 2523 2524 if (ctxt->node == NULL) { 2525 #ifdef DEBUG_SAX_TREE 2526 xmlGenericError(xmlGenericErrorContext, 2527 "add chars: ctxt->node == NULL !\n"); 2528 #endif 2529 return; 2530 } 2531 lastChild = ctxt->node->last; 2532 #ifdef DEBUG_SAX_TREE 2533 xmlGenericError(xmlGenericErrorContext, 2534 "add chars to %s \n", ctxt->node->name); 2535 #endif 2536 2537 /* 2538 * Here we needed an accelerator mechanism in case of very large 2539 * elements. Use an attribute in the structure !!! 2540 */ 2541 if (lastChild == NULL) { 2542 lastChild = xmlSAX2TextNode(ctxt, ch, len); 2543 if (lastChild != NULL) { 2544 ctxt->node->children = lastChild; 2545 ctxt->node->last = lastChild; 2546 lastChild->parent = ctxt->node; 2547 lastChild->doc = ctxt->node->doc; 2548 ctxt->nodelen = len; 2549 ctxt->nodemem = len + 1; 2550 } else { 2551 xmlSAX2ErrMemory(ctxt, "xmlSAX2Characters"); 2552 return; 2553 } 2554 } else { 2555 int coalesceText = (lastChild != NULL) && 2556 (lastChild->type == XML_TEXT_NODE) && 2557 (lastChild->name == xmlStringText); 2558 if ((coalesceText) && (ctxt->nodemem != 0)) { 2559 /* 2560 * The whole point of maintaining nodelen and nodemem, 2561 * xmlTextConcat is too costly, i.e. compute length, 2562 * reallocate a new buffer, move data, append ch. Here 2563 * We try to minimaze realloc() uses and avoid copying 2564 * and recomputing length over and over. 2565 */ 2566 if (lastChild->content == (xmlChar *)&(lastChild->properties)) { 2567 lastChild->content = xmlStrdup(lastChild->content); 2568 lastChild->properties = NULL; 2569 } else if ((ctxt->nodemem == ctxt->nodelen + 1) && 2570 (xmlDictOwns(ctxt->dict, lastChild->content))) { 2571 lastChild->content = xmlStrdup(lastChild->content); 2572 } 2573 if (((size_t)ctxt->nodelen + (size_t)len > XML_MAX_TEXT_LENGTH) && 2574 ((ctxt->options & XML_PARSE_HUGE) == 0)) { 2575 xmlSAX2ErrMemory(ctxt, "xmlSAX2Characters: huge text node"); 2576 return; 2577 } 2578 if ((size_t)ctxt->nodelen > SIZE_T_MAX - (size_t)len || 2579 (size_t)ctxt->nodemem + (size_t)len > SIZE_T_MAX / 2) { 2580 xmlSAX2ErrMemory(ctxt, "xmlSAX2Characters overflow prevented"); 2581 return; 2582 } 2583 if (ctxt->nodelen + len >= ctxt->nodemem) { 2584 xmlChar *newbuf; 2585 size_t size; 2586 2587 size = ctxt->nodemem + len; 2588 size *= 2; 2589 newbuf = (xmlChar *) xmlRealloc(lastChild->content,size); 2590 if (newbuf == NULL) { 2591 xmlSAX2ErrMemory(ctxt, "xmlSAX2Characters"); 2592 return; 2593 } 2594 ctxt->nodemem = size; 2595 lastChild->content = newbuf; 2596 } 2597 memcpy(&lastChild->content[ctxt->nodelen], ch, len); 2598 ctxt->nodelen += len; 2599 lastChild->content[ctxt->nodelen] = 0; 2600 } else if (coalesceText) { 2601 if (xmlTextConcat(lastChild, ch, len)) { 2602 xmlSAX2ErrMemory(ctxt, "xmlSAX2Characters"); 2603 } 2604 if (ctxt->node->children != NULL) { 2605 ctxt->nodelen = xmlStrlen(lastChild->content); 2606 ctxt->nodemem = ctxt->nodelen + 1; 2607 } 2608 } else { 2609 /* Mixed content, first time */ 2610 lastChild = xmlSAX2TextNode(ctxt, ch, len); 2611 if (lastChild != NULL) { 2612 xmlAddChild(ctxt->node, lastChild); 2613 if (ctxt->node->children != NULL) { 2614 ctxt->nodelen = len; 2615 ctxt->nodemem = len + 1; 2616 } 2617 } 2618 } 2619 } 2620 } 2621 2622 /** 2623 * xmlSAX2IgnorableWhitespace: 2624 * @ctx: the user data (XML parser context) 2625 * @ch: a xmlChar string 2626 * @len: the number of xmlChar 2627 * 2628 * receiving some ignorable whitespaces from the parser. 2629 * UNUSED: by default the DOM building will use xmlSAX2Characters 2630 */ 2631 void 2632 xmlSAX2IgnorableWhitespace(void *ctx ATTRIBUTE_UNUSED, const xmlChar *ch ATTRIBUTE_UNUSED, int len ATTRIBUTE_UNUSED) 2633 { 2634 /* xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; */ 2635 #ifdef DEBUG_SAX 2636 xmlGenericError(xmlGenericErrorContext, 2637 "SAX.xmlSAX2IgnorableWhitespace(%.30s, %d)\n", ch, len); 2638 #endif 2639 } 2640 2641 /** 2642 * xmlSAX2ProcessingInstruction: 2643 * @ctx: the user data (XML parser context) 2644 * @target: the target name 2645 * @data: the PI data's 2646 * 2647 * A processing instruction has been parsed. 2648 */ 2649 void 2650 xmlSAX2ProcessingInstruction(void *ctx, const xmlChar *target, 2651 const xmlChar *data) 2652 { 2653 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; 2654 xmlNodePtr ret; 2655 xmlNodePtr parent; 2656 2657 if (ctx == NULL) return; 2658 parent = ctxt->node; 2659 #ifdef DEBUG_SAX 2660 xmlGenericError(xmlGenericErrorContext, 2661 "SAX.xmlSAX2ProcessingInstruction(%s, %s)\n", target, data); 2662 #endif 2663 2664 ret = xmlNewDocPI(ctxt->myDoc, target, data); 2665 if (ret == NULL) return; 2666 2667 if (ctxt->linenumbers) { 2668 if (ctxt->input != NULL) { 2669 if (ctxt->input->line < 65535) 2670 ret->line = (short) ctxt->input->line; 2671 else 2672 ret->line = 65535; 2673 } 2674 } 2675 if (ctxt->inSubset == 1) { 2676 xmlAddChild((xmlNodePtr) ctxt->myDoc->intSubset, ret); 2677 return; 2678 } else if (ctxt->inSubset == 2) { 2679 xmlAddChild((xmlNodePtr) ctxt->myDoc->extSubset, ret); 2680 return; 2681 } 2682 if (parent == NULL) { 2683 #ifdef DEBUG_SAX_TREE 2684 xmlGenericError(xmlGenericErrorContext, 2685 "Setting PI %s as root\n", target); 2686 #endif 2687 xmlAddChild((xmlNodePtr) ctxt->myDoc, (xmlNodePtr) ret); 2688 return; 2689 } 2690 if (parent->type == XML_ELEMENT_NODE) { 2691 #ifdef DEBUG_SAX_TREE 2692 xmlGenericError(xmlGenericErrorContext, 2693 "adding PI %s child to %s\n", target, parent->name); 2694 #endif 2695 xmlAddChild(parent, ret); 2696 } else { 2697 #ifdef DEBUG_SAX_TREE 2698 xmlGenericError(xmlGenericErrorContext, 2699 "adding PI %s sibling to ", target); 2700 xmlDebugDumpOneNode(stderr, parent, 0); 2701 #endif 2702 xmlAddSibling(parent, ret); 2703 } 2704 } 2705 2706 /** 2707 * xmlSAX2Comment: 2708 * @ctx: the user data (XML parser context) 2709 * @value: the xmlSAX2Comment content 2710 * 2711 * A xmlSAX2Comment has been parsed. 2712 */ 2713 void 2714 xmlSAX2Comment(void *ctx, const xmlChar *value) 2715 { 2716 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; 2717 xmlNodePtr ret; 2718 xmlNodePtr parent; 2719 2720 if (ctx == NULL) return; 2721 parent = ctxt->node; 2722 #ifdef DEBUG_SAX 2723 xmlGenericError(xmlGenericErrorContext, "SAX.xmlSAX2Comment(%s)\n", value); 2724 #endif 2725 ret = xmlNewDocComment(ctxt->myDoc, value); 2726 if (ret == NULL) return; 2727 if (ctxt->linenumbers) { 2728 if (ctxt->input != NULL) { 2729 if (ctxt->input->line < 65535) 2730 ret->line = (short) ctxt->input->line; 2731 else 2732 ret->line = 65535; 2733 } 2734 } 2735 2736 if (ctxt->inSubset == 1) { 2737 xmlAddChild((xmlNodePtr) ctxt->myDoc->intSubset, ret); 2738 return; 2739 } else if (ctxt->inSubset == 2) { 2740 xmlAddChild((xmlNodePtr) ctxt->myDoc->extSubset, ret); 2741 return; 2742 } 2743 if (parent == NULL) { 2744 #ifdef DEBUG_SAX_TREE 2745 xmlGenericError(xmlGenericErrorContext, 2746 "Setting xmlSAX2Comment as root\n"); 2747 #endif 2748 xmlAddChild((xmlNodePtr) ctxt->myDoc, (xmlNodePtr) ret); 2749 return; 2750 } 2751 if (parent->type == XML_ELEMENT_NODE) { 2752 #ifdef DEBUG_SAX_TREE 2753 xmlGenericError(xmlGenericErrorContext, 2754 "adding xmlSAX2Comment child to %s\n", parent->name); 2755 #endif 2756 xmlAddChild(parent, ret); 2757 } else { 2758 #ifdef DEBUG_SAX_TREE 2759 xmlGenericError(xmlGenericErrorContext, 2760 "adding xmlSAX2Comment sibling to "); 2761 xmlDebugDumpOneNode(stderr, parent, 0); 2762 #endif 2763 xmlAddSibling(parent, ret); 2764 } 2765 } 2766 2767 /** 2768 * xmlSAX2CDataBlock: 2769 * @ctx: the user data (XML parser context) 2770 * @value: The pcdata content 2771 * @len: the block length 2772 * 2773 * called when a pcdata block has been parsed 2774 */ 2775 void 2776 xmlSAX2CDataBlock(void *ctx, const xmlChar *value, int len) 2777 { 2778 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; 2779 xmlNodePtr ret, lastChild; 2780 2781 if (ctx == NULL) return; 2782 #ifdef DEBUG_SAX 2783 xmlGenericError(xmlGenericErrorContext, 2784 "SAX.pcdata(%.10s, %d)\n", value, len); 2785 #endif 2786 lastChild = xmlGetLastChild(ctxt->node); 2787 #ifdef DEBUG_SAX_TREE 2788 xmlGenericError(xmlGenericErrorContext, 2789 "add chars to %s \n", ctxt->node->name); 2790 #endif 2791 if ((lastChild != NULL) && 2792 (lastChild->type == XML_CDATA_SECTION_NODE)) { 2793 xmlTextConcat(lastChild, value, len); 2794 } else { 2795 ret = xmlNewCDataBlock(ctxt->myDoc, value, len); 2796 xmlAddChild(ctxt->node, ret); 2797 } 2798 } 2799 2800 static int xmlSAX2DefaultVersionValue = 2; 2801 2802 #ifdef LIBXML_SAX1_ENABLED 2803 /** 2804 * xmlSAXDefaultVersion: 2805 * @version: the version, 1 or 2 2806 * 2807 * Set the default version of SAX used globally by the library. 2808 * By default, during initialization the default is set to 2. 2809 * Note that it is generally a better coding style to use 2810 * xmlSAXVersion() to set up the version explicitly for a given 2811 * parsing context. 2812 * 2813 * Returns the previous value in case of success and -1 in case of error. 2814 */ 2815 int 2816 xmlSAXDefaultVersion(int version) 2817 { 2818 int ret = xmlSAX2DefaultVersionValue; 2819 2820 if ((version != 1) && (version != 2)) 2821 return(-1); 2822 xmlSAX2DefaultVersionValue = version; 2823 return(ret); 2824 } 2825 #endif /* LIBXML_SAX1_ENABLED */ 2826 2827 /** 2828 * xmlSAXVersion: 2829 * @hdlr: the SAX handler 2830 * @version: the version, 1 or 2 2831 * 2832 * Initialize the default XML SAX handler according to the version 2833 * 2834 * Returns 0 in case of success and -1 in case of error. 2835 */ 2836 int 2837 xmlSAXVersion(xmlSAXHandler *hdlr, int version) 2838 { 2839 if (hdlr == NULL) return(-1); 2840 if (version == 2) { 2841 hdlr->startElement = NULL; 2842 hdlr->endElement = NULL; 2843 hdlr->startElementNs = xmlSAX2StartElementNs; 2844 hdlr->endElementNs = xmlSAX2EndElementNs; 2845 hdlr->serror = NULL; 2846 hdlr->initialized = XML_SAX2_MAGIC; 2847 #ifdef LIBXML_SAX1_ENABLED 2848 } else if (version == 1) { 2849 hdlr->startElement = xmlSAX2StartElement; 2850 hdlr->endElement = xmlSAX2EndElement; 2851 hdlr->initialized = 1; 2852 #endif /* LIBXML_SAX1_ENABLED */ 2853 } else 2854 return(-1); 2855 hdlr->internalSubset = xmlSAX2InternalSubset; 2856 hdlr->externalSubset = xmlSAX2ExternalSubset; 2857 hdlr->isStandalone = xmlSAX2IsStandalone; 2858 hdlr->hasInternalSubset = xmlSAX2HasInternalSubset; 2859 hdlr->hasExternalSubset = xmlSAX2HasExternalSubset; 2860 hdlr->resolveEntity = xmlSAX2ResolveEntity; 2861 hdlr->getEntity = xmlSAX2GetEntity; 2862 hdlr->getParameterEntity = xmlSAX2GetParameterEntity; 2863 hdlr->entityDecl = xmlSAX2EntityDecl; 2864 hdlr->attributeDecl = xmlSAX2AttributeDecl; 2865 hdlr->elementDecl = xmlSAX2ElementDecl; 2866 hdlr->notationDecl = xmlSAX2NotationDecl; 2867 hdlr->unparsedEntityDecl = xmlSAX2UnparsedEntityDecl; 2868 hdlr->setDocumentLocator = xmlSAX2SetDocumentLocator; 2869 hdlr->startDocument = xmlSAX2StartDocument; 2870 hdlr->endDocument = xmlSAX2EndDocument; 2871 hdlr->reference = xmlSAX2Reference; 2872 hdlr->characters = xmlSAX2Characters; 2873 hdlr->cdataBlock = xmlSAX2CDataBlock; 2874 hdlr->ignorableWhitespace = xmlSAX2Characters; 2875 hdlr->processingInstruction = xmlSAX2ProcessingInstruction; 2876 hdlr->comment = xmlSAX2Comment; 2877 hdlr->warning = xmlParserWarning; 2878 hdlr->error = xmlParserError; 2879 hdlr->fatalError = xmlParserError; 2880 2881 return(0); 2882 } 2883 2884 /** 2885 * xmlSAX2InitDefaultSAXHandler: 2886 * @hdlr: the SAX handler 2887 * @warning: flag if non-zero sets the handler warning procedure 2888 * 2889 * Initialize the default XML SAX2 handler 2890 */ 2891 void 2892 xmlSAX2InitDefaultSAXHandler(xmlSAXHandler *hdlr, int warning) 2893 { 2894 if ((hdlr == NULL) || (hdlr->initialized != 0)) 2895 return; 2896 2897 xmlSAXVersion(hdlr, xmlSAX2DefaultVersionValue); 2898 if (warning == 0) 2899 hdlr->warning = NULL; 2900 else 2901 hdlr->warning = xmlParserWarning; 2902 } 2903 2904 /** 2905 * xmlDefaultSAXHandlerInit: 2906 * 2907 * Initialize the default SAX2 handler 2908 */ 2909 void 2910 xmlDefaultSAXHandlerInit(void) 2911 { 2912 #ifdef LIBXML_SAX1_ENABLED 2913 xmlSAXVersion((xmlSAXHandlerPtr) &xmlDefaultSAXHandler, 1); 2914 #endif /* LIBXML_SAX1_ENABLED */ 2915 } 2916 2917 #ifdef LIBXML_HTML_ENABLED 2918 2919 /** 2920 * xmlSAX2InitHtmlDefaultSAXHandler: 2921 * @hdlr: the SAX handler 2922 * 2923 * Initialize the default HTML SAX2 handler 2924 */ 2925 void 2926 xmlSAX2InitHtmlDefaultSAXHandler(xmlSAXHandler *hdlr) 2927 { 2928 if ((hdlr == NULL) || (hdlr->initialized != 0)) 2929 return; 2930 2931 hdlr->internalSubset = xmlSAX2InternalSubset; 2932 hdlr->externalSubset = NULL; 2933 hdlr->isStandalone = NULL; 2934 hdlr->hasInternalSubset = NULL; 2935 hdlr->hasExternalSubset = NULL; 2936 hdlr->resolveEntity = NULL; 2937 hdlr->getEntity = xmlSAX2GetEntity; 2938 hdlr->getParameterEntity = NULL; 2939 hdlr->entityDecl = NULL; 2940 hdlr->attributeDecl = NULL; 2941 hdlr->elementDecl = NULL; 2942 hdlr->notationDecl = NULL; 2943 hdlr->unparsedEntityDecl = NULL; 2944 hdlr->setDocumentLocator = xmlSAX2SetDocumentLocator; 2945 hdlr->startDocument = xmlSAX2StartDocument; 2946 hdlr->endDocument = xmlSAX2EndDocument; 2947 hdlr->startElement = xmlSAX2StartElement; 2948 hdlr->endElement = xmlSAX2EndElement; 2949 hdlr->reference = NULL; 2950 hdlr->characters = xmlSAX2Characters; 2951 hdlr->cdataBlock = xmlSAX2CDataBlock; 2952 hdlr->ignorableWhitespace = xmlSAX2IgnorableWhitespace; 2953 hdlr->processingInstruction = xmlSAX2ProcessingInstruction; 2954 hdlr->comment = xmlSAX2Comment; 2955 hdlr->warning = xmlParserWarning; 2956 hdlr->error = xmlParserError; 2957 hdlr->fatalError = xmlParserError; 2958 2959 hdlr->initialized = 1; 2960 } 2961 2962 /** 2963 * htmlDefaultSAXHandlerInit: 2964 * 2965 * Initialize the default SAX handler 2966 */ 2967 void 2968 htmlDefaultSAXHandlerInit(void) 2969 { 2970 xmlSAX2InitHtmlDefaultSAXHandler((xmlSAXHandlerPtr) &htmlDefaultSAXHandler); 2971 } 2972 2973 #endif /* LIBXML_HTML_ENABLED */ 2974 2975 #ifdef LIBXML_DOCB_ENABLED 2976 2977 /** 2978 * xmlSAX2InitDocbDefaultSAXHandler: 2979 * @hdlr: the SAX handler 2980 * 2981 * Initialize the default DocBook SAX2 handler 2982 */ 2983 void 2984 xmlSAX2InitDocbDefaultSAXHandler(xmlSAXHandler *hdlr) 2985 { 2986 if ((hdlr == NULL) || (hdlr->initialized != 0)) 2987 return; 2988 2989 hdlr->internalSubset = xmlSAX2InternalSubset; 2990 hdlr->externalSubset = NULL; 2991 hdlr->isStandalone = xmlSAX2IsStandalone; 2992 hdlr->hasInternalSubset = xmlSAX2HasInternalSubset; 2993 hdlr->hasExternalSubset = xmlSAX2HasExternalSubset; 2994 hdlr->resolveEntity = xmlSAX2ResolveEntity; 2995 hdlr->getEntity = xmlSAX2GetEntity; 2996 hdlr->getParameterEntity = NULL; 2997 hdlr->entityDecl = xmlSAX2EntityDecl; 2998 hdlr->attributeDecl = NULL; 2999 hdlr->elementDecl = NULL; 3000 hdlr->notationDecl = NULL; 3001 hdlr->unparsedEntityDecl = NULL; 3002 hdlr->setDocumentLocator = xmlSAX2SetDocumentLocator; 3003 hdlr->startDocument = xmlSAX2StartDocument; 3004 hdlr->endDocument = xmlSAX2EndDocument; 3005 hdlr->startElement = xmlSAX2StartElement; 3006 hdlr->endElement = xmlSAX2EndElement; 3007 hdlr->reference = xmlSAX2Reference; 3008 hdlr->characters = xmlSAX2Characters; 3009 hdlr->cdataBlock = NULL; 3010 hdlr->ignorableWhitespace = xmlSAX2IgnorableWhitespace; 3011 hdlr->processingInstruction = NULL; 3012 hdlr->comment = xmlSAX2Comment; 3013 hdlr->warning = xmlParserWarning; 3014 hdlr->error = xmlParserError; 3015 hdlr->fatalError = xmlParserError; 3016 3017 hdlr->initialized = 1; 3018 } 3019 3020 /** 3021 * docbDefaultSAXHandlerInit: 3022 * 3023 * Initialize the default SAX handler 3024 */ 3025 void 3026 docbDefaultSAXHandlerInit(void) 3027 { 3028 xmlSAX2InitDocbDefaultSAXHandler((xmlSAXHandlerPtr) &docbDefaultSAXHandler); 3029 } 3030 3031 #endif /* LIBXML_DOCB_ENABLED */ 3032 #define bottom_SAX2 3033 #include "elfgcchack.h" 3034