2 * SAX2.c : Default SAX2 handler to build a tree.
4 * See Copyright for the status of this software.
6 * Daniel Veillard <daniel@veillard.com>
15 #include <libxml/xmlmemory.h>
16 #include <libxml/tree.h>
17 #include <libxml/parser.h>
18 #include <libxml/parserInternals.h>
19 #include <libxml/valid.h>
20 #include <libxml/entities.h>
21 #include <libxml/xmlerror.h>
22 #include <libxml/debugXML.h>
23 #include <libxml/xmlIO.h>
24 #include <libxml/SAX.h>
25 #include <libxml/uri.h>
26 #include <libxml/valid.h>
27 #include <libxml/HTMLtree.h>
28 #include <libxml/globals.h>
30 /* Define SIZE_T_MAX unless defined through <limits.h>. */
32 # define SIZE_T_MAX ((size_t)-1)
33 #endif /* !SIZE_T_MAX */
35 /* #define DEBUG_SAX2 */
36 /* #define DEBUG_SAX2_TREE */
41 * macro to flag unimplemented blocks
42 * XML_CATALOG_PREFER user env to select between system/public preferred
43 * option. C.f. Richard Tobin <richard@cogsci.ed.ac.uk>
44 *> Just FYI, I am using an environment variable XML_CATALOG_PREFER with
45 *> values "system" and "public". I have made the default be "system" to
49 xmlGenericError(xmlGenericErrorContext, \
50 "Unimplemented block at %s:%d\n", \
55 * @ctxt: an XML validation parser context
56 * @msg: a string to accompany the error message
/* Report an allocation failure: raises XML_ERR_NO_MEMORY in the
 * XML_FROM_PARSER domain at XML_ERR_ERROR level, forwarding both msg and
 * the fixed "out of memory" text to __xmlRaiseError. */
59 xmlSAX2ErrMemory(xmlParserCtxtPtr ctxt, const char *msg) {
60 xmlStructuredErrorFunc schannel = NULL;
61 const char *str1 = "out of memory\n";
64 ctxt->errNo = XML_ERR_NO_MEMORY;
/* The structured error callback is only picked up when the SAX block
 * carries the SAX2 magic value. */
65 if ((ctxt->sax != NULL) && (ctxt->sax->initialized == XML_SAX2_MAGIC))
66 schannel = ctxt->sax->serror;
67 __xmlRaiseError(schannel,
68 ctxt->vctxt.error, ctxt->vctxt.userData,
69 ctxt, NULL, XML_FROM_PARSER, XML_ERR_NO_MEMORY,
70 XML_ERR_ERROR, NULL, 0, (const char *) str1,
72 msg, (const char *) str1, NULL);
/* Record the error code and move the parser state to XML_PARSER_EOF. */
73 ctxt->errNo = XML_ERR_NO_MEMORY;
74 ctxt->instate = XML_PARSER_EOF;
/* NOTE(review): a second raise call follows; the condition selecting
 * between the two calls is not visible here -- confirm against the full
 * source (presumably a NULL-context fallback). */
77 __xmlRaiseError(schannel,
79 ctxt, NULL, XML_FROM_PARSER, XML_ERR_NO_MEMORY,
80 XML_ERR_ERROR, NULL, 0, (const char *) str1,
82 msg, (const char *) str1, NULL);
88 * @ctxt: an XML validation parser context
89 * @error: the error number
90 * @msg: the error message
94 * Handle a validation error
/* Raise a validation error in the XML_FROM_DTD domain at XML_ERR_ERROR
 * level. str1 and str2 are forwarded both as the structured strings and as
 * the arguments following msg. */
97 xmlErrValid(xmlParserCtxtPtr ctxt, xmlParserErrors error,
98 const char *msg, const char *str1, const char *str2)
100 xmlStructuredErrorFunc schannel = NULL;
/* Tests for a parser whose SAX callbacks are disabled and which is already
 * in the XML_PARSER_EOF state. NOTE(review): the statement guarded by this
 * test is not visible here -- presumably an early return; confirm. */
102 if ((ctxt != NULL) && (ctxt->disableSAX != 0) &&
103 (ctxt->instate == XML_PARSER_EOF))
/* The structured error callback is only picked up when the SAX block
 * carries the SAX2 magic value. */
107 if ((ctxt->sax != NULL) && (ctxt->sax->initialized == XML_SAX2_MAGIC))
108 schannel = ctxt->sax->serror;
109 __xmlRaiseError(schannel,
110 ctxt->vctxt.error, ctxt->vctxt.userData,
111 ctxt, NULL, XML_FROM_DTD, error,
112 XML_ERR_ERROR, NULL, 0, (const char *) str1,
113 (const char *) str2, NULL, 0, 0,
114 msg, (const char *) str1, (const char *) str2);
/* NOTE(review): second raise call; the branch that selects it is not
 * visible here. */
117 __xmlRaiseError(schannel,
119 ctxt, NULL, XML_FROM_DTD, error,
120 XML_ERR_ERROR, NULL, 0, (const char *) str1,
121 (const char *) str2, NULL, 0, 0,
122 msg, (const char *) str1, (const char *) str2);
128 * @ctxt: an XML parser context
129 * @error: the error number
130 * @msg: the error message
131 * @str1: an error string
132 * @str2: an error string
134 * Handle a fatal parser error, i.e. violating Well-Formedness constraints
/* Raise a fatal error (XML_ERR_FATAL) in the XML_FROM_PARSER domain, then
 * mark the document as not well-formed. */
137 xmlFatalErrMsg(xmlParserCtxtPtr ctxt, xmlParserErrors error,
138 const char *msg, const xmlChar *str1, const xmlChar *str2)
/* Tests for a parser with SAX disabled that is already in the
 * XML_PARSER_EOF state. NOTE(review): the guarded statement is not visible
 * here -- presumably an early return; confirm. */
140 if ((ctxt != NULL) && (ctxt->disableSAX != 0) &&
141 (ctxt->instate == XML_PARSER_EOF))
/* No structured channel, generic channel or user data is supplied here. */
145 __xmlRaiseError(NULL, NULL, NULL, ctxt, NULL, XML_FROM_PARSER, error,
146 XML_ERR_FATAL, NULL, 0,
147 (const char *) str1, (const char *) str2,
148 NULL, 0, 0, msg, str1, str2);
150 ctxt->wellFormed = 0;
/* Outside recovery mode, further SAX callbacks are switched off. */
152 if (ctxt->recovery == 0)
153 ctxt->disableSAX = 1;
159 * @ctxt: an XML parser context
160 * @error: the error number
161 * @msg: the error message
162 * @str1: an error string
163 * @str2: an error string
165 * Handle a parser warning
/* Raise a warning (XML_ERR_WARNING) in the XML_FROM_PARSER domain.
 * Only one message argument, str1, is accepted and forwarded; this
 * signature has no str2 parameter. */
168 xmlWarnMsg(xmlParserCtxtPtr ctxt, xmlParserErrors error,
169 const char *msg, const xmlChar *str1)
/* Tests for a parser with SAX disabled that is already in the
 * XML_PARSER_EOF state. NOTE(review): the guarded statement is not visible
 * here -- presumably an early return; confirm. */
171 if ((ctxt != NULL) && (ctxt->disableSAX != 0) &&
172 (ctxt->instate == XML_PARSER_EOF))
176 __xmlRaiseError(NULL, NULL, NULL, ctxt, NULL, XML_FROM_PARSER, error,
177 XML_ERR_WARNING, NULL, 0,
178 (const char *) str1, NULL,
179 NULL, 0, 0, msg, str1);
184 * @ctxt: an XML parser context
185 * @error: the error number
186 * @msg: the error message
187 * @str1: an error string
188 * @str2: an error string
190 * Handle a namespace error
/* Raise an error (XML_ERR_ERROR) in the XML_FROM_NAMESPACE domain,
 * forwarding str1 and str2 as message arguments. */
193 xmlNsErrMsg(xmlParserCtxtPtr ctxt, xmlParserErrors error,
194 const char *msg, const xmlChar *str1, const xmlChar *str2)
/* Tests for a parser with SAX disabled that is already in the
 * XML_PARSER_EOF state. NOTE(review): the guarded statement is not visible
 * here -- presumably an early return; confirm. */
196 if ((ctxt != NULL) && (ctxt->disableSAX != 0) &&
197 (ctxt->instate == XML_PARSER_EOF))
201 __xmlRaiseError(NULL, NULL, NULL, ctxt, NULL, XML_FROM_NAMESPACE, error,
202 XML_ERR_ERROR, NULL, 0,
203 (const char *) str1, (const char *) str2,
204 NULL, 0, 0, msg, str1, str2);
209 * @ctxt: an XML parser context
210 * @error: the error number
211 * @msg: the error message
212 * @str1: an error string
214 * Handle a namespace warning
/* Raise a warning (XML_ERR_WARNING) in the XML_FROM_NAMESPACE domain.
 * Takes two message arguments: str1 and str2 are both forwarded. */
217 xmlNsWarnMsg(xmlParserCtxtPtr ctxt, xmlParserErrors error,
218 const char *msg, const xmlChar *str1, const xmlChar *str2)
/* Tests for a parser with SAX disabled that is already in the
 * XML_PARSER_EOF state. NOTE(review): the guarded statement is not visible
 * here -- presumably an early return; confirm. */
220 if ((ctxt != NULL) && (ctxt->disableSAX != 0) &&
221 (ctxt->instate == XML_PARSER_EOF))
225 __xmlRaiseError(NULL, NULL, NULL, ctxt, NULL, XML_FROM_NAMESPACE, error,
226 XML_ERR_WARNING, NULL, 0,
227 (const char *) str1, (const char *) str2,
228 NULL, 0, 0, msg, str1, str2);
232 * xmlSAX2GetPublicId:
233 * @ctx: the user data (XML parser context)
235 * Provides the public ID e.g. "-//SGMLSOURCE//DTD DEMO//EN"
237 * Returns a xmlChar *
/* ctx is declared ATTRIBUTE_UNUSED and the context cast below is commented
 * out, so nothing visible here reads the parser context.
 * NOTE(review): the return statement is not visible here. */
240 xmlSAX2GetPublicId(void *ctx ATTRIBUTE_UNUSED)
242 /* xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; */
247 * xmlSAX2GetSystemId:
248 * @ctx: the user data (XML parser context)
250 * Provides the system ID, basically URL or filename e.g.
251 * http://www.sgmlsource.com/dtds/memo.dtd
253 * Returns a xmlChar *
/* Return the filename of the current input as the system ID. */
256 xmlSAX2GetSystemId(void *ctx)
258 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
/* Without a context or a current input there is nothing to report. */
259 if ((ctx == NULL) || (ctxt->input == NULL)) return(NULL);
260 return((const xmlChar *) ctxt->input->filename);
264 * xmlSAX2GetLineNumber:
265 * @ctx: the user data (XML parser context)
267 * Provide the line number of the current parsing point.
/* Return the line field of the current input. */
272 xmlSAX2GetLineNumber(void *ctx)
274 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
/* 0 is returned when there is no context or no current input. */
275 if ((ctx == NULL) || (ctxt->input == NULL)) return(0);
276 return(ctxt->input->line);
280 * xmlSAX2GetColumnNumber:
281 * @ctx: the user data (XML parser context)
283 * Provide the column number of the current parsing point.
/* Return the col field of the current input. */
288 xmlSAX2GetColumnNumber(void *ctx)
290 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
/* 0 is returned when there is no context or no current input. */
291 if ((ctx == NULL) || (ctxt->input == NULL)) return(0);
292 return(ctxt->input->col);
296 * xmlSAX2IsStandalone:
297 * @ctx: the user data (XML parser context)
299 * Is this document tagged standalone ?
/* Report whether the document's standalone field is exactly 1. */
304 xmlSAX2IsStandalone(void *ctx)
306 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
/* 0 is returned when there is no context or no document yet. */
307 if ((ctx == NULL) || (ctxt->myDoc == NULL)) return(0);
/* Any other value of standalone yields 0. */
308 return(ctxt->myDoc->standalone == 1);
312 * xmlSAX2HasInternalSubset:
313 * @ctx: the user data (XML parser context)
315 * Does this document have an internal subset?
/* Report whether the document has a non-NULL intSubset pointer. */
320 xmlSAX2HasInternalSubset(void *ctx)
322 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
/* 0 is returned when there is no context or no document yet. */
323 if ((ctxt == NULL) || (ctxt->myDoc == NULL)) return(0);
324 return(ctxt->myDoc->intSubset != NULL);
328 * xmlSAX2HasExternalSubset:
329 * @ctx: the user data (XML parser context)
331 * Does this document have an external subset?
/* Report whether the document has a non-NULL extSubset pointer. */
336 xmlSAX2HasExternalSubset(void *ctx)
338 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
/* 0 is returned when there is no context or no document yet. */
339 if ((ctxt == NULL) || (ctxt->myDoc == NULL)) return(0);
340 return(ctxt->myDoc->extSubset != NULL);
344 * xmlSAX2InternalSubset:
345 * @ctx: the user data (XML parser context)
346 * @name: the root element name
347 * @ExternalID: the external ID
348 * @SystemID: the SYSTEM ID (e.g. filename or URL)
350 * Callback on internal subset declaration.
/* Create the document's internal subset from name, ExternalID and SystemID. */
353 xmlSAX2InternalSubset(void *ctx, const xmlChar *name,
354 const xmlChar *ExternalID, const xmlChar *SystemID)
356 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
358 if (ctx == NULL) return;
/* Trace output; NOTE(review): presumably compiled only in a debug build --
 * the enclosing guard is not visible here. */
360 xmlGenericError(xmlGenericErrorContext,
361 "SAX.xmlSAX2InternalSubset(%s, %s, %s)\n",
362 name, ExternalID, SystemID);
365 if (ctxt->myDoc == NULL)
/* An already attached internal subset is looked up; the visible statements
 * unlink it from the tree and clear the document's intSubset pointer.
 * NOTE(review): the conditions guarding these steps are not visible here. */
367 dtd = xmlGetIntSubset(ctxt->myDoc);
371 xmlUnlinkNode((xmlNodePtr) dtd);
373 ctxt->myDoc->intSubset = NULL;
375 ctxt->myDoc->intSubset =
376 xmlCreateIntSubset(ctxt->myDoc, name, ExternalID, SystemID);
/* A NULL result from the creation is reported as a memory error. */
377 if (ctxt->myDoc->intSubset == NULL)
378 xmlSAX2ErrMemory(ctxt, "xmlSAX2InternalSubset");
382 * xmlSAX2ExternalSubset:
383 * @ctx: the user data (XML parser context)
384 * @name: the root element name
385 * @ExternalID: the external ID
386 * @SystemID: the SYSTEM ID (e.g. filename or URL)
388 * Callback on external subset declaration.
/* Fetch the external subset through the SAX resolveEntity callback and parse
 * it with xmlParseExternalSubset, saving and restoring the main input state
 * of the parser context around the nested parse. */
391 xmlSAX2ExternalSubset(void *ctx, const xmlChar *name,
392 const xmlChar *ExternalID, const xmlChar *SystemID)
394 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
395 if (ctx == NULL) return;
397 xmlGenericError(xmlGenericErrorContext,
398 "SAX.xmlSAX2ExternalSubset(%s, %s, %s)\n",
399 name, ExternalID, SystemID);
/* Proceed only when an identifier was given, validation or subset loading
 * is requested, and the context is still well-formed with a document. */
401 if (((ExternalID != NULL) || (SystemID != NULL)) &&
402 (((ctxt->validate) || (ctxt->loadsubset != 0)) &&
403 (ctxt->wellFormed && ctxt->myDoc))) {
405 * Try to fetch and parse the external subset.
407 xmlParserInputPtr oldinput;
410 xmlParserInputPtr *oldinputTab;
411 xmlParserInputPtr input = NULL;
414 const xmlChar *oldencoding;
417 * Ask the Entity resolver to load the damn thing
419 if ((ctxt->sax != NULL) && (ctxt->sax->resolveEntity != NULL))
420 input = ctxt->sax->resolveEntity(ctxt->userData, ExternalID,
426 xmlNewDtd(ctxt->myDoc, name, ExternalID, SystemID);
429 * make sure we won't destroy the main document context
/* Snapshot of the input stack, charset and encoding of the main document. */
431 oldinput = ctxt->input;
432 oldinputNr = ctxt->inputNr;
433 oldinputMax = ctxt->inputMax;
434 oldinputTab = ctxt->inputTab;
435 oldcharset = ctxt->charset;
436 oldencoding = ctxt->encoding;
437 ctxt->encoding = NULL;
/* A fresh input table sized for 5 entries is allocated for the nested parse. */
439 ctxt->inputTab = (xmlParserInputPtr *)
440 xmlMalloc(5 * sizeof(xmlParserInputPtr));
/* On allocation failure the error is reported and every saved field is put
 * back before leaving. */
441 if (ctxt->inputTab == NULL) {
442 xmlSAX2ErrMemory(ctxt, "xmlSAX2ExternalSubset");
443 ctxt->input = oldinput;
444 ctxt->inputNr = oldinputNr;
445 ctxt->inputMax = oldinputMax;
446 ctxt->inputTab = oldinputTab;
447 ctxt->charset = oldcharset;
448 ctxt->encoding = oldencoding;
454 xmlPushInput(ctxt, input);
457 * On the fly encoding conversion if needed
/* Encoding detection is only attempted when the input length is at least 4;
 * the first 4 bytes are handed to the detector. */
459 if (ctxt->input->length >= 4) {
460 enc = xmlDetectCharEncoding(ctxt->input->cur, 4);
461 xmlSwitchEncoding(ctxt, enc);
/* An input without a filename gets the canonical path of SystemID. */
464 if (input->filename == NULL)
465 input->filename = (char *) xmlCanonicPath(SystemID);
468 input->base = ctxt->input->cur;
469 input->cur = ctxt->input->cur;
473 * let's parse that entity knowing it's an external subset.
475 xmlParseExternalSubset(ctxt, ExternalID, SystemID);
478 * Free up the external entities
/* NOTE(review): the body of this loop is not visible here. */
481 while (ctxt->inputNr > 1)
483 xmlFreeInputStream(ctxt->input);
484 xmlFree(ctxt->inputTab);
487 * Restore the parsing context of the main entity
489 ctxt->input = oldinput;
490 ctxt->inputNr = oldinputNr;
491 ctxt->inputMax = oldinputMax;
492 ctxt->inputTab = oldinputTab;
493 ctxt->charset = oldcharset;
/* The encoding string set during the nested parse is freed unless the
 * context dictionary owns it; the saved encoding is then restored. */
494 if ((ctxt->encoding != NULL) &&
495 ((ctxt->dict == NULL) ||
496 (!xmlDictOwns(ctxt->dict, ctxt->encoding))))
497 xmlFree((xmlChar *) ctxt->encoding);
498 ctxt->encoding = oldencoding;
499 /* ctxt->wellFormed = oldwellFormed; */
504 * xmlSAX2ResolveEntity:
505 * @ctx: the user data (XML parser context)
506 * @publicId: The public ID of the entity
507 * @systemId: The system ID of the entity
509 * The entity loader, to control the loading of external entities,
510 * the application can either:
511 * - override this xmlSAX2ResolveEntity() callback in the SAX block
512 * - or better use the xmlSetExternalEntityLoader() function to
513 * set up its own entity resolution routine
515 * Returns the xmlParserInputPtr if inlined or NULL for DOM behaviour.
/* Build a URI from systemId against a base and load the entity through
 * xmlLoadExternalEntity. */
518 xmlSAX2ResolveEntity(void *ctx, const xmlChar *publicId, const xmlChar *systemId)
520 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
521 xmlParserInputPtr ret;
523 const char *base = NULL;
525 if (ctx == NULL) return(NULL);
/* The base comes from the current input's filename; ctxt->directory is the
 * other candidate. NOTE(review): the condition selecting the directory is
 * not visible here -- presumably used when no filename is available. */
526 if (ctxt->input != NULL)
527 base = ctxt->input->filename;
529 base = ctxt->directory;
531 URI = xmlBuildURI(systemId, (const xmlChar *) base);
534 xmlGenericError(xmlGenericErrorContext,
535 "SAX.xmlSAX2ResolveEntity(%s, %s)\n", publicId, systemId);
/* The built URI, not the raw systemId, is what gets loaded. */
538 ret = xmlLoadExternalEntity((const char *) URI,
539 (const char *) publicId, ctxt);
547 * @ctx: the user data (XML parser context)
548 * @name: The entity name
550 * Get an entity by name
552 * Returns the xmlEntityPtr if found.
/* Look up a general entity by name, consulting the predefined entities and
 * the document's entity declarations. */
555 xmlSAX2GetEntity(void *ctx, const xmlChar *name)
557 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
558 xmlEntityPtr ret = NULL;
560 if (ctx == NULL) return(NULL);
562 xmlGenericError(xmlGenericErrorContext,
563 "SAX.xmlSAX2GetEntity(%s)\n", name);
/* Predefined entities are consulted when not inside a DTD subset. */
566 if (ctxt->inSubset == 0) {
567 ret = xmlGetPredefinedEntity(name);
/* For a standalone document the standalone flag is temporarily cleared
 * around xmlGetDocEntity and set back to 1 afterwards. */
571 if ((ctxt->myDoc != NULL) && (ctxt->myDoc->standalone == 1)) {
572 if (ctxt->inSubset == 2) {
573 ctxt->myDoc->standalone = 0;
574 ret = xmlGetDocEntity(ctxt->myDoc, name);
575 ctxt->myDoc->standalone = 1;
577 ret = xmlGetDocEntity(ctxt->myDoc, name);
579 ctxt->myDoc->standalone = 0;
580 ret = xmlGetDocEntity(ctxt->myDoc, name);
582 xmlFatalErrMsg(ctxt, XML_ERR_NOT_STANDALONE,
583 "Entity(%s) document marked standalone but requires external subset\n",
586 ctxt->myDoc->standalone = 1;
590 ret = xmlGetDocEntity(ctxt->myDoc, name);
/* An external parsed entity that has no children yet is loaded when
 * validating or when entities are being replaced. */
593 ((ctxt->validate) || (ctxt->replaceEntities)) &&
594 (ret->children == NULL) &&
595 (ret->etype == XML_EXTERNAL_GENERAL_PARSED_ENTITY)) {
599 * for validation purposes we really need to fetch and
600 * parse the external entity
/* Entity counter before the nested parse; used below to derive checked. */
603 unsigned long oldnbent = ctxt->nbentities;
605 val = xmlParseCtxtExternalEntity(ctxt, ret->URI,
606 ret->ExternalID, &children);
608 xmlAddChildList((xmlNodePtr) ret, children);
610 xmlFatalErrMsg(ctxt, XML_ERR_ENTITY_PROCESSING,
611 "Failure to process entity %s\n", name, NULL);
/* checked is filled in only once, from the number of entities counted
 * during the nested parse. */
616 if (ret->checked == 0) {
617 ret->checked = (ctxt->nbentities - oldnbent + 1) * 2;
618 if ((ret->content != NULL) && (xmlStrchr(ret->content, '<')))
626 * xmlSAX2GetParameterEntity:
627 * @ctx: the user data (XML parser context)
628 * @name: The entity name
630 * Get a parameter entity by name
632 * Returns the xmlEntityPtr if found.
/* Look up a parameter entity by name in the context's document. */
635 xmlSAX2GetParameterEntity(void *ctx, const xmlChar *name)
637 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
640 if (ctx == NULL) return(NULL);
642 xmlGenericError(xmlGenericErrorContext,
643 "SAX.xmlSAX2GetParameterEntity(%s)\n", name);
/* The lookup is delegated entirely to xmlGetParameterEntity. */
646 ret = xmlGetParameterEntity(ctxt->myDoc, name);
653 * @ctx: the user data (XML parser context)
654 * @name: the entity name
655 * @type: the entity type
656 * @publicId: The public ID of the entity
657 * @systemId: The system ID of the entity
658 * @content: the entity value (without processing).
660 * An entity definition has been parsed
/* Register an entity declaration in the internal subset (inSubset == 1) or
 * the external subset (inSubset == 2); any other value raises a fatal error. */
663 xmlSAX2EntityDecl(void *ctx, const xmlChar *name, int type,
664 const xmlChar *publicId, const xmlChar *systemId, xmlChar *content)
667 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
669 if (ctx == NULL) return;
671 xmlGenericError(xmlGenericErrorContext,
672 "SAX.xmlSAX2EntityDecl(%s, %d, %s, %s, %s)\n",
673 name, type, publicId, systemId, content);
675 if (ctxt->inSubset == 1) {
676 ent = xmlAddDocEntity(ctxt->myDoc, name, type, publicId,
/* A NULL result is only reported in pedantic mode, as a redefinition warning. */
678 if ((ent == NULL) && (ctxt->pedantic))
679 xmlWarnMsg(ctxt, XML_WAR_ENTITY_REDEFINED,
680 "Entity(%s) already defined in the internal subset\n",
/* For a new entity without a URI, one is built from systemId against the
 * current input's filename or ctxt->directory.
 * NOTE(review): the fallback condition and the assignment of the result
 * are not visible here. */
682 if ((ent != NULL) && (ent->URI == NULL) && (systemId != NULL)) {
684 const char *base = NULL;
686 if (ctxt->input != NULL)
687 base = ctxt->input->filename;
689 base = ctxt->directory;
691 URI = xmlBuildURI(systemId, (const xmlChar *) base);
694 } else if (ctxt->inSubset == 2) {
695 ent = xmlAddDtdEntity(ctxt->myDoc, name, type, publicId,
/* NOTE(review): this branch calls the SAX warning callback directly, while
 * the internal-subset branch above goes through xmlWarnMsg. */
697 if ((ent == NULL) && (ctxt->pedantic) &&
698 (ctxt->sax != NULL) && (ctxt->sax->warning != NULL))
699 ctxt->sax->warning(ctxt->userData,
700 "Entity(%s) already defined in the external subset\n", name);
701 if ((ent != NULL) && (ent->URI == NULL) && (systemId != NULL)) {
703 const char *base = NULL;
705 if (ctxt->input != NULL)
706 base = ctxt->input->filename;
708 base = ctxt->directory;
710 URI = xmlBuildURI(systemId, (const xmlChar *) base);
714 xmlFatalErrMsg(ctxt, XML_ERR_ENTITY_PROCESSING,
715 "SAX.xmlSAX2EntityDecl(%s) called while not in subset\n",
721 * xmlSAX2AttributeDecl:
722 * @ctx: the user data (XML parser context)
723 * @elem: the name of the element
724 * @fullname: the attribute name
725 * @type: the attribute type
726 * @def: the type of default value
727 * @defaultValue: the attribute default value
728 * @tree: the tree of enumerated value set
730 * An attribute definition has been parsed
/* Register an attribute declaration in the internal or external subset,
 * depending on ctxt->inSubset, and validate it when validation is enabled. */
733 xmlSAX2AttributeDecl(void *ctx, const xmlChar *elem, const xmlChar *fullname,
734 int type, int def, const xmlChar *defaultValue,
735 xmlEnumerationPtr tree)
737 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
738 xmlAttributePtr attr;
739 xmlChar *name = NULL, *prefix = NULL;
741 if ((ctxt == NULL) || (ctxt->myDoc == NULL))
745 xmlGenericError(xmlGenericErrorContext,
746 "SAX.xmlSAX2AttributeDecl(%s, %s, %d, %d, %s, ...)\n",
747 elem, fullname, type, def, defaultValue);
/* An xml:id attribute declared with a type other than ID is reported. */
749 if ((xmlStrEqual(fullname, BAD_CAST "xml:id")) &&
750 (type != XML_ATTRIBUTE_ID)) {
752 * Raise the error but keep the validity flag
/* NOTE(review): the statement restoring ctxt->valid from tmp is not
 * visible here. */
754 int tmp = ctxt->valid;
755 xmlErrValid(ctxt, XML_DTD_XMLID_TYPE,
756 "xml:id : attribute type should be ID\n", NULL, NULL);
759 /* TODO: optimize name/prefix allocation */
760 name = xmlSplitQName(ctxt, fullname, &prefix);
/* The validation-context flag is set to 1 before the declaration is added
 * and is tested again after it. */
761 ctxt->vctxt.valid = 1;
762 if (ctxt->inSubset == 1)
763 attr = xmlAddAttributeDecl(&ctxt->vctxt, ctxt->myDoc->intSubset, elem,
764 name, prefix, (xmlAttributeType) type,
765 (xmlAttributeDefault) def, defaultValue, tree);
766 else if (ctxt->inSubset == 2)
767 attr = xmlAddAttributeDecl(&ctxt->vctxt, ctxt->myDoc->extSubset, elem,
768 name, prefix, (xmlAttributeType) type,
769 (xmlAttributeDefault) def, defaultValue, tree);
/* Outside either subset: report an internal error and release the
 * enumeration tree. */
771 xmlFatalErrMsg(ctxt, XML_ERR_INTERNAL_ERROR,
772 "SAX.xmlSAX2AttributeDecl(%s) called while not in subset\n",
774 xmlFreeEnumeration(tree);
777 #ifdef LIBXML_VALID_ENABLED
778 if (ctxt->vctxt.valid == 0)
/* The declaration is validated only when validating a well-formed document
 * that has an internal subset. */
780 if ((attr != NULL) && (ctxt->validate) && (ctxt->wellFormed) &&
781 (ctxt->myDoc->intSubset != NULL))
782 ctxt->valid &= xmlValidateAttributeDecl(&ctxt->vctxt, ctxt->myDoc,
784 #endif /* LIBXML_VALID_ENABLED */
792 * xmlSAX2ElementDecl:
793 * @ctx: the user data (XML parser context)
794 * @name: the element name
795 * @type: the element type
796 * @content: the element value tree
798 * An element definition has been parsed
/* Register an element declaration in the internal or external subset,
 * depending on ctxt->inSubset. */
801 xmlSAX2ElementDecl(void *ctx, const xmlChar * name, int type,
802 xmlElementContentPtr content)
804 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
805 xmlElementPtr elem = NULL;
807 if ((ctxt == NULL) || (ctxt->myDoc == NULL))
811 xmlGenericError(xmlGenericErrorContext,
812 "SAX.xmlSAX2ElementDecl(%s, %d, ...)\n", name, type);
815 if (ctxt->inSubset == 1)
816 elem = xmlAddElementDecl(&ctxt->vctxt, ctxt->myDoc->intSubset,
817 name, (xmlElementTypeVal) type, content);
818 else if (ctxt->inSubset == 2)
819 elem = xmlAddElementDecl(&ctxt->vctxt, ctxt->myDoc->extSubset,
820 name, (xmlElementTypeVal) type, content);
/* Any other inSubset value is reported as an internal error. */
822 xmlFatalErrMsg(ctxt, XML_ERR_INTERNAL_ERROR,
823 "SAX.xmlSAX2ElementDecl(%s) called while not in subset\n",
827 #ifdef LIBXML_VALID_ENABLED
/* The declaration is validated only when validating a well-formed document
 * that has an internal subset. */
830 if (ctxt->validate && ctxt->wellFormed &&
831 ctxt->myDoc && ctxt->myDoc->intSubset)
833 xmlValidateElementDecl(&ctxt->vctxt, ctxt->myDoc, elem);
834 #endif /* LIBXML_VALID_ENABLED */
838 * xmlSAX2NotationDecl:
839 * @ctx: the user data (XML parser context)
840 * @name: The name of the notation
841 * @publicId: The public ID of the entity
842 * @systemId: The system ID of the entity
844 * What to do when a notation declaration has been parsed.
/* Register a notation declaration in the internal or external subset,
 * depending on ctxt->inSubset. */
847 xmlSAX2NotationDecl(void *ctx, const xmlChar *name,
848 const xmlChar *publicId, const xmlChar *systemId)
850 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
851 xmlNotationPtr nota = NULL;
853 if ((ctxt == NULL) || (ctxt->myDoc == NULL))
857 xmlGenericError(xmlGenericErrorContext,
858 "SAX.xmlSAX2NotationDecl(%s, %s, %s)\n", name, publicId, systemId);
/* At least one of publicId and systemId must be supplied. */
861 if ((publicId == NULL) && (systemId == NULL)) {
862 xmlFatalErrMsg(ctxt, XML_ERR_NOTATION_PROCESSING,
863 "SAX.xmlSAX2NotationDecl(%s) externalID or PublicID missing\n",
866 } else if (ctxt->inSubset == 1)
867 nota = xmlAddNotationDecl(&ctxt->vctxt, ctxt->myDoc->intSubset, name,
869 else if (ctxt->inSubset == 2)
870 nota = xmlAddNotationDecl(&ctxt->vctxt, ctxt->myDoc->extSubset, name,
873 xmlFatalErrMsg(ctxt, XML_ERR_NOTATION_PROCESSING,
874 "SAX.xmlSAX2NotationDecl(%s) called while not in subset\n",
878 #ifdef LIBXML_VALID_ENABLED
/* A notation that could not be added clears the validity flag. */
879 if (nota == NULL) ctxt->valid = 0;
880 if ((ctxt->validate) && (ctxt->wellFormed) &&
881 (ctxt->myDoc->intSubset != NULL))
882 ctxt->valid &= xmlValidateNotationDecl(&ctxt->vctxt, ctxt->myDoc,
884 #endif /* LIBXML_VALID_ENABLED */
888 * xmlSAX2UnparsedEntityDecl:
889 * @ctx: the user data (XML parser context)
890 * @name: The name of the entity
891 * @publicId: The public ID of the entity
892 * @systemId: The system ID of the entity
893 * @notationName: the name of the notation
895 * What to do when an unparsed entity declaration is parsed
/* Register an unparsed entity (XML_EXTERNAL_GENERAL_UNPARSED_ENTITY) in the
 * internal or external subset, depending on ctxt->inSubset. notationName is
 * passed in the final argument slot of the entity-adding call. */
898 xmlSAX2UnparsedEntityDecl(void *ctx, const xmlChar *name,
899 const xmlChar *publicId, const xmlChar *systemId,
900 const xmlChar *notationName)
903 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
904 if (ctx == NULL) return;
906 xmlGenericError(xmlGenericErrorContext,
907 "SAX.xmlSAX2UnparsedEntityDecl(%s, %s, %s, %s)\n",
908 name, publicId, systemId, notationName);
910 if (ctxt->inSubset == 1) {
911 ent = xmlAddDocEntity(ctxt->myDoc, name,
912 XML_EXTERNAL_GENERAL_UNPARSED_ENTITY,
913 publicId, systemId, notationName);
/* A NULL result is only reported in pedantic mode, through the SAX warning
 * callback when one is installed. */
914 if ((ent == NULL) && (ctxt->pedantic) &&
915 (ctxt->sax != NULL) && (ctxt->sax->warning != NULL))
916 ctxt->sax->warning(ctxt->userData,
917 "Entity(%s) already defined in the internal subset\n", name);
/* For a new entity without a URI, one is built from systemId against the
 * current input's filename or ctxt->directory.
 * NOTE(review): the fallback condition and the assignment of the result
 * are not visible here. */
918 if ((ent != NULL) && (ent->URI == NULL) && (systemId != NULL)) {
920 const char *base = NULL;
922 if (ctxt->input != NULL)
923 base = ctxt->input->filename;
925 base = ctxt->directory;
927 URI = xmlBuildURI(systemId, (const xmlChar *) base);
930 } else if (ctxt->inSubset == 2) {
931 ent = xmlAddDtdEntity(ctxt->myDoc, name,
932 XML_EXTERNAL_GENERAL_UNPARSED_ENTITY,
933 publicId, systemId, notationName);
934 if ((ent == NULL) && (ctxt->pedantic) &&
935 (ctxt->sax != NULL) && (ctxt->sax->warning != NULL))
936 ctxt->sax->warning(ctxt->userData,
937 "Entity(%s) already defined in the external subset\n", name);
938 if ((ent != NULL) && (ent->URI == NULL) && (systemId != NULL)) {
940 const char *base = NULL;
942 if (ctxt->input != NULL)
943 base = ctxt->input->filename;
945 base = ctxt->directory;
947 URI = xmlBuildURI(systemId, (const xmlChar *) base);
/* Any other inSubset value is reported as an internal error. */
951 xmlFatalErrMsg(ctxt, XML_ERR_INTERNAL_ERROR,
952 "SAX.xmlSAX2UnparsedEntityDecl(%s) called while not in subset\n",
958 * xmlSAX2SetDocumentLocator:
959 * @ctx: the user data (XML parser context)
960 * @loc: A SAX Locator
962 * Receive the document locator at startup, actually xmlDefaultSAXLocator
963 * Everything is available on the context, so this is useless in our case.
/* Both parameters are declared ATTRIBUTE_UNUSED; the only visible statement
 * is a trace message. */
966 xmlSAX2SetDocumentLocator(void *ctx ATTRIBUTE_UNUSED, xmlSAXLocatorPtr loc ATTRIBUTE_UNUSED)
968 /* xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; */
970 xmlGenericError(xmlGenericErrorContext,
971 "SAX.xmlSAX2SetDocumentLocator()\n");
976 * xmlSAX2StartDocument:
977 * @ctx: the user data (XML parser context)
979 * Called when the document starts being processed.
/* Create the document object for the parse and seed it from the parser
 * context (options, encoding, standalone flag, dictionary, URL). */
982 xmlSAX2StartDocument(void *ctx)
984 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
987 if (ctx == NULL) return;
990 xmlGenericError(xmlGenericErrorContext,
991 "SAX.xmlSAX2StartDocument()\n");
/* HTML path: a document without DTD is created if none exists, tagged
 * XML_DOC_HTML, and given the context's option flags.
 * NOTE(review): the test selecting the HTML path is not visible here. */
994 #ifdef LIBXML_HTML_ENABLED
995 if (ctxt->myDoc == NULL)
996 ctxt->myDoc = htmlNewDocNoDtD(NULL, NULL);
997 if (ctxt->myDoc == NULL) {
998 xmlSAX2ErrMemory(ctxt, "xmlSAX2StartDocument");
1001 ctxt->myDoc->properties = XML_DOC_HTML;
1002 ctxt->myDoc->parseFlags = ctxt->options;
/* Without HTML support the parser is put in the EOF state with SAX disabled. */
1004 xmlGenericError(xmlGenericErrorContext,
1005 "libxml2 built without HTML support\n");
1006 ctxt->errNo = XML_ERR_INTERNAL_ERROR;
1007 ctxt->instate = XML_PARSER_EOF;
1008 ctxt->disableSAX = 1;
/* XML path: the document is created with the context's version string. */
1012 doc = ctxt->myDoc = xmlNewDoc(ctxt->version);
1014 doc->properties = 0;
1015 if (ctxt->options & XML_PARSE_OLD10)
1016 doc->properties |= XML_DOC_OLD10;
1017 doc->parseFlags = ctxt->options;
/* The document receives its own copy of the context's encoding string. */
1018 if (ctxt->encoding != NULL)
1019 doc->encoding = xmlStrdup(ctxt->encoding);
1021 doc->encoding = NULL;
1022 doc->standalone = ctxt->standalone;
1024 xmlSAX2ErrMemory(ctxt, "xmlSAX2StartDocument");
/* When dictionary names are in use the document shares the context's
 * dictionary and takes a reference on it. */
1027 if ((ctxt->dictNames) && (doc != NULL)) {
1028 doc->dict = ctxt->dict;
1029 xmlDictReference(doc->dict);
/* A document without a URL gets one derived from the input's filename. */
1032 if ((ctxt->myDoc != NULL) && (ctxt->myDoc->URL == NULL) &&
1033 (ctxt->input != NULL) && (ctxt->input->filename != NULL)) {
1034 ctxt->myDoc->URL = xmlPathToURI((const xmlChar *)ctxt->input->filename);
1035 if (ctxt->myDoc->URL == NULL)
1036 xmlSAX2ErrMemory(ctxt, "xmlSAX2StartDocument");
1041 * xmlSAX2EndDocument:
1042 * @ctx: the user data (XML parser context)
1044 * called when the document end has been detected.
/* Finish the document: run final validation when enabled and copy encoding
 * and charset information from the context to the document. */
1047 xmlSAX2EndDocument(void *ctx)
1049 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
1051 xmlGenericError(xmlGenericErrorContext,
1052 "SAX.xmlSAX2EndDocument()\n");
1054 if (ctx == NULL) return;
1055 #ifdef LIBXML_VALID_ENABLED
/* Final validation runs only for a well-formed document that has an
 * internal subset; its result is folded into ctxt->valid. */
1056 if (ctxt->validate && ctxt->wellFormed &&
1057 ctxt->myDoc && ctxt->myDoc->intSubset)
1058 ctxt->valid &= xmlValidateDocumentFinal(&ctxt->vctxt, ctxt->myDoc);
1059 #endif /* LIBXML_VALID_ENABLED */
1062 * Grab the encoding if it was added on-the-fly
/* The encoding pointer is moved to the document (not copied) and the
 * context's pointer is cleared. */
1064 if ((ctxt->encoding != NULL) && (ctxt->myDoc != NULL) &&
1065 (ctxt->myDoc->encoding == NULL)) {
1066 ctxt->myDoc->encoding = ctxt->encoding;
1067 ctxt->encoding = NULL;
/* If the document still has no encoding, the first input's encoding is
 * duplicated into it. */
1069 if ((ctxt->inputTab != NULL) &&
1070 (ctxt->inputNr > 0) && (ctxt->inputTab[0] != NULL) &&
1071 (ctxt->inputTab[0]->encoding != NULL) && (ctxt->myDoc != NULL) &&
1072 (ctxt->myDoc->encoding == NULL)) {
1073 ctxt->myDoc->encoding = xmlStrdup(ctxt->inputTab[0]->encoding);
/* The context's charset is copied only when the document has none set. */
1075 if ((ctxt->charset != XML_CHAR_ENCODING_NONE) && (ctxt->myDoc != NULL) &&
1076 (ctxt->myDoc->charset == XML_CHAR_ENCODING_NONE)) {
1077 ctxt->myDoc->charset = ctxt->charset;
1081 #if defined(LIBXML_SAX1_ENABLED) || defined(LIBXML_HTML_ENABLED) || defined(LIBXML_WRITER_ENABLED) || defined(LIBXML_DOCB_ENABLED) || defined(LIBXML_LEGACY_ENABLED)
1083 * xmlSAX2AttributeInternal:
1084 * @ctx: the user data (XML parser context)
1085 * @fullname: The attribute name, including namespace prefix
1086 * @value: The attribute value
1087 * @prefix: the prefix on the element node
1089 * Handle an attribute that has been read by the parser.
1090 * The default handling is to convert the attribute into a
1091 * DOM subtree and paste it into a new xmlAttr element added to
/* Process one attribute of the element at ctxt->node: split the qualified
 * name, handle xmlns declarations by creating namespace nodes, otherwise
 * create the property, validate it when enabled, and register IDs and
 * references. The prefix parameter is declared ATTRIBUTE_UNUSED, yet it is
 * passed to xmlValidateOneNamespace in the validation sections below. */
1095 xmlSAX2AttributeInternal(void *ctx, const xmlChar *fullname,
1096 const xmlChar *value, const xmlChar *prefix ATTRIBUTE_UNUSED)
1098 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
1106 name = xmlStrdup(fullname);
1111 * Split the full name into a namespace prefix and the tag name
1113 name = xmlSplitQName(ctxt, fullname, &ns);
/* An empty local part after the split is reported: as an error for an
 * "xmlns" prefix, and the other visible report is a warning. */
1114 if ((name != NULL) && (name[0] == 0)) {
1115 if (xmlStrEqual(ns, BAD_CAST "xmlns")) {
1116 xmlNsErrMsg(ctxt, XML_ERR_NS_DECL_ERROR,
1117 "invalid namespace declaration '%s'\n",
1120 xmlNsWarnMsg(ctxt, XML_WAR_NS_COLUMN,
1121 "Avoid attribute ending with ':' like '%s'\n",
1128 name = xmlStrdup(fullname);
1132 xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElement");
1138 #ifdef LIBXML_HTML_ENABLED
/* A boolean HTML attribute given without a value takes its own name as
 * its value. */
1140 (value == NULL) && (htmlIsBooleanAttr(fullname))) {
1141 nval = xmlStrdup(fullname);
1142 value = (const xmlChar *) nval;
1146 #ifdef LIBXML_VALID_ENABLED
1148 * Do the last stage of the attribute normalization
1149 * Needed for HTML too:
1150 * http://www.w3.org/TR/html4/types.html#h-6.2
1152 ctxt->vctxt.valid = 1;
1153 nval = xmlValidCtxtNormalizeAttributeValue(&ctxt->vctxt,
1154 ctxt->myDoc, ctxt->node,
1156 if (ctxt->vctxt.valid != 1) {
1163 #endif /* LIBXML_VALID_ENABLED */
1167 * Check whether it's a namespace definition
/* Outside HTML: no prefix and a local name spelling exactly "xmlns". */
1169 if ((!ctxt->html) && (ns == NULL) &&
1170 (name[0] == 'x') && (name[1] == 'm') && (name[2] == 'l') &&
1171 (name[3] == 'n') && (name[4] == 's') && (name[5] == 0)) {
/* When entities are not replaced by the parser, the value is decoded here;
 * otherwise the raw value is used as is. */
1175 if (!ctxt->replaceEntities) {
1177 val = xmlStringDecodeEntities(ctxt, value, XML_SUBSTITUTE_REF,
1181 xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElement");
1187 val = (xmlChar *) value;
/* The namespace name is parsed as a URI; the visible warnings cover an
 * unparsable URI and one without a scheme. */
1193 uri = xmlParseURI((const char *)val);
1195 if ((ctxt->sax != NULL) && (ctxt->sax->warning != NULL))
1196 ctxt->sax->warning(ctxt->userData,
1197 "xmlns: %s not a valid URI\n", val);
1199 if (uri->scheme == NULL) {
1200 if ((ctxt->sax != NULL) && (ctxt->sax->warning != NULL))
1201 ctxt->sax->warning(ctxt->userData,
1202 "xmlns: URI %s is not absolute\n", val);
1208 /* a default namespace definition */
1209 nsret = xmlNewNs(ctxt->node, val, NULL);
1211 #ifdef LIBXML_VALID_ENABLED
1213 * Validate also for namespace decls, they are attributes from
1214 * an XML-1.0 perspective
1216 if (nsret != NULL && ctxt->validate && ctxt->wellFormed &&
1217 ctxt->myDoc && ctxt->myDoc->intSubset)
1218 ctxt->valid &= xmlValidateOneNamespace(&ctxt->vctxt, ctxt->myDoc,
1219 ctxt->node, prefix, nsret, val);
1220 #endif /* LIBXML_VALID_ENABLED */
/* Outside HTML: a prefix spelling exactly "xmlns", i.e. a prefixed
 * namespace declaration whose prefix name is held in name. */
1229 if ((!ctxt->html) &&
1230 (ns != NULL) && (ns[0] == 'x') && (ns[1] == 'm') && (ns[2] == 'l') &&
1231 (ns[3] == 'n') && (ns[4] == 's') && (ns[5] == 0)) {
1235 if (!ctxt->replaceEntities) {
1237 val = xmlStringDecodeEntities(ctxt, value, XML_SUBSTITUTE_REF,
1241 xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElement");
1248 val = (xmlChar *) value;
1252 xmlNsErrMsg(ctxt, XML_NS_ERR_EMPTY,
1253 "Empty namespace name for prefix %s\n", name, NULL);
/* URI checks on a prefixed declaration run only in pedantic mode and only
 * for a non-empty value. */
1255 if ((ctxt->pedantic != 0) && (val[0] != 0)) {
1258 uri = xmlParseURI((const char *)val);
1260 xmlNsWarnMsg(ctxt, XML_WAR_NS_URI,
1261 "xmlns:%s: %s not a valid URI\n", name, value);
1263 if (uri->scheme == NULL) {
1264 xmlNsWarnMsg(ctxt, XML_WAR_NS_URI_RELATIVE,
1265 "xmlns:%s: URI %s is not absolute\n", name, value);
1271 /* a standard namespace definition */
1272 nsret = xmlNewNs(ctxt->node, val, name);
1274 #ifdef LIBXML_VALID_ENABLED
1276 * Validate also for namespace decls, they are attributes from
1277 * an XML-1.0 perspective
1279 if (nsret != NULL && ctxt->validate && ctxt->wellFormed &&
1280 ctxt->myDoc && ctxt->myDoc->intSubset)
1281 ctxt->valid &= xmlValidateOneNamespace(&ctxt->vctxt, ctxt->myDoc,
1282 ctxt->node, prefix, nsret, value);
1283 #endif /* LIBXML_VALID_ENABLED */
/* Ordinary attribute: the prefix is resolved against the namespaces in
 * scope at the current node. */
1294 namespace = xmlSearchNs(ctxt->myDoc, ctxt->node, ns);
1296 if (namespace == NULL) {
1297 xmlNsErrMsg(ctxt, XML_NS_ERR_UNDEFINED_NAMESPACE,
1298 "Namespace prefix %s of attribute %s is not defined\n",
/* Existing namespaced properties are scanned for a duplicate: same local
 * name and either the same namespace node or an equal href. */
1303 prop = ctxt->node->properties;
1304 while (prop != NULL) {
1305 if (prop->ns != NULL) {
1306 if ((xmlStrEqual(name, prop->name)) &&
1307 ((namespace == prop->ns) ||
1308 (xmlStrEqual(namespace->href, prop->ns->href)))) {
1309 xmlNsErrMsg(ctxt, XML_ERR_ATTRIBUTE_REDEFINED,
1310 "Attribute %s in %s redefined\n",
1311 name, namespace->href);
1312 ctxt->wellFormed = 0;
1313 if (ctxt->recovery == 0) ctxt->disableSAX = 1;
1324 /* !!!!!! <a toto:arg="" xmlns:toto="http://toto.com"> */
1325 ret = xmlNewNsPropEatName(ctxt->node, namespace, name, NULL);
/* Without entity replacement (and outside HTML) the value becomes a node
 * list whose members are re-parented to the attribute; otherwise a single
 * text node holds the value. */
1328 if ((ctxt->replaceEntities == 0) && (!ctxt->html)) {
1331 ret->children = xmlStringGetNodeList(ctxt->myDoc, value);
1332 tmp = ret->children;
1333 while (tmp != NULL) {
1334 tmp->parent = (xmlNodePtr) ret;
1335 if (tmp->next == NULL)
1339 } else if (value != NULL) {
1340 ret->children = xmlNewDocText(ctxt->myDoc, value);
1341 ret->last = ret->children;
1342 if (ret->children != NULL)
1343 ret->children->parent = (xmlNodePtr) ret;
1347 #ifdef LIBXML_VALID_ENABLED
1348 if ((!ctxt->html) && ctxt->validate && ctxt->wellFormed &&
1349 ctxt->myDoc && ctxt->myDoc->intSubset) {
1352 * If we don't substitute entities, the validation should be
1353 * done on a value with replaced entities anyway.
1355 if (!ctxt->replaceEntities) {
1359 val = xmlStringDecodeEntities(ctxt, value, XML_SUBSTITUTE_REF,
1364 ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt,
1365 ctxt->myDoc, ctxt->node, ret, value);
1370 * Do the last stage of the attribute normalization
1371 * It need to be done twice ... it's an extra burden related
1372 * to the ability to keep xmlSAX2References in attributes
1374 nvalnorm = xmlValidNormalizeAttributeValue(ctxt->myDoc,
1375 ctxt->node, fullname, val);
1376 if (nvalnorm != NULL) {
1381 ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt,
1382 ctxt->myDoc, ctxt->node, ret, val);
1386 ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt, ctxt->myDoc,
1387 ctxt->node, ret, value);
1390 #endif /* LIBXML_VALID_ENABLED */
/* ID and reference registration is skipped when XML_SKIP_IDS is set in
 * loadsubset, and otherwise depends on replaceEntities, external and
 * inSubset as tested here. */
1391 if (((ctxt->loadsubset & XML_SKIP_IDS) == 0) &&
1392 (((ctxt->replaceEntities == 0) && (ctxt->external != 2)) ||
1393 ((ctxt->replaceEntities != 0) && (ctxt->inSubset == 0)))) {
1395 * when validating, the ID registration is done at the attribute
1396 * validation level. Otherwise we have to do specific handling here.
1398 if (xmlStrEqual(fullname, BAD_CAST "xml:id")) {
1400 * Add the xml:id value
1402 * Open issue: normalization of the value.
/* A value that is not an NCName is reported, and the ID is still added. */
1404 if (xmlValidateNCName(value, 1) != 0) {
1405 xmlErrValid(ctxt, XML_DTD_XMLID_VALUE,
1406 "xml:id : attribute value %s is not an NCName\n",
1407 (const char *) value, NULL);
1409 xmlAddID(&ctxt->vctxt, ctxt->myDoc, value, ret);
1410 } else if (xmlIsID(ctxt->myDoc, ctxt->node, ret))
1411 xmlAddID(&ctxt->vctxt, ctxt->myDoc, value, ret);
1412 else if (xmlIsRef(ctxt->myDoc, ctxt->node, ret))
1413 xmlAddRef(&ctxt->vctxt, ctxt->myDoc, value, ret);
1424 * xmlCheckDefaultedAttributes:
1426 * Check defaulted attributes from the DTD
/*
 * Apply the DTD attribute defaults for the element identified by
 * name/prefix.
 *
 * The element declaration is looked up in the document's internal subset
 * and, if absent there, in the external subset.  Two passes then walk the
 * attributes declared for that element:
 *  - when the document is flagged standalone and has an external subset,
 *    attributes whose default is declared in the external subset and not
 *    in the internal one are compared against atts and may be reported
 *    as XML_DTD_STANDALONE_DEFAULTED;
 *  - defaulted attributes that are namespace declarations ("xmlns" or an
 *    "xmlns" prefix), or any defaulted attribute when XML_COMPLETE_ATTRS
 *    is set in ctxt->loadsubset, are compared against atts and handed to
 *    xmlSAX2AttributeInternal() with their default value.
 *
 * ctxt:   parser context; ctxt->myDoc is dereferenced without a NULL test
 * name:   element name used for the DTD lookups
 * prefix: element prefix used for the DTD lookups and forwarded to
 *         xmlSAX2AttributeInternal()
 * atts:   attributes supplied on the element; presumably laid out as
 *         name/value pairs -- confirm against the caller
 */
1429 xmlCheckDefaultedAttributes(xmlParserCtxtPtr ctxt, const xmlChar *name,
1430 const xmlChar *prefix, const xmlChar **atts) {
1431 xmlElementPtr elemDecl;
/* Prefer the internal-subset declaration; fall back to the external one. */
1436 elemDecl = xmlGetDtdQElementDesc(ctxt->myDoc->intSubset, name, prefix);
1437 if (elemDecl == NULL) {
1438 elemDecl = xmlGetDtdQElementDesc(ctxt->myDoc->extSubset, name, prefix);
1442 process_external_subset:
1444 if (elemDecl != NULL) {
1445 xmlAttributePtr attr = elemDecl->attributes;
1447 * Check against defaulted attributes from the external subset
1448 * if the document is stamped as standalone
1450 if ((ctxt->myDoc->standalone == 1) &&
1451 (ctxt->myDoc->extSubset != NULL) &&
1453 while (attr != NULL) {
1454 if ((attr->defaultValue != NULL) &&
1455 (xmlGetDtdQAttrDesc(ctxt->myDoc->extSubset,
1456 attr->elem, attr->name,
1457 attr->prefix) == attr) &&
1458 (xmlGetDtdQAttrDesc(ctxt->myDoc->intSubset,
1459 attr->elem, attr->name,
1460 attr->prefix) == NULL)) {
/* Build "prefix:name" (or a copy of the bare name) to compare with atts. */
1463 if (attr->prefix != NULL) {
1464 fulln = xmlStrdup(attr->prefix);
1465 fulln = xmlStrcat(fulln, BAD_CAST ":");
1466 fulln = xmlStrcat(fulln, attr->name);
1468 fulln = xmlStrdup(attr->name);
1470 if (fulln == NULL) {
1471 xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElement");
1476 * Check that the attribute is not declared in the
1483 while (att != NULL) {
1484 if (xmlStrEqual(att, fulln))
1491 xmlErrValid(ctxt, XML_DTD_STANDALONE_DEFAULTED,
1492 "standalone: attribute %s on %s defaulted from external subset\n",
1493 (const char *)fulln,
1494 (const char *)attr->elem);
1503 * Actually insert defaulted values when needed
1505 attr = elemDecl->attributes;
1506 while (attr != NULL) {
1508 * Make sure that attributes redefinition occuring in the
1509 * internal subset are not overriden by definitions in the
1512 if (attr->defaultValue != NULL) {
1514 * the element should be instantiated in the tree if:
1515 * - this is a namespace prefix
1516 * - the user required for completion in the tree
1518 * - there isn't already an attribute definition
1519 * in the internal subset overriding it.
1521 if (((attr->prefix != NULL) &&
1522 (xmlStrEqual(attr->prefix, BAD_CAST "xmlns"))) ||
1523 ((attr->prefix == NULL) &&
1524 (xmlStrEqual(attr->name, BAD_CAST "xmlns"))) ||
1525 (ctxt->loadsubset & XML_COMPLETE_ATTRS)) {
1526 xmlAttributePtr tst;
1528 tst = xmlGetDtdQAttrDesc(ctxt->myDoc->intSubset,
1529 attr->elem, attr->name,
1531 if ((tst == attr) || (tst == NULL)) {
/* fn (size 50) is offered to xmlBuildQName() as a scratch buffer; the
 * result is later compared with fn and attr->name before being released,
 * so it may alias either of them. */
1535 fulln = xmlBuildQName(attr->name, attr->prefix, fn, 50);
1536 if (fulln == NULL) {
1537 xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElement");
1542 * Check that the attribute is not declared in the
1549 while (att != NULL) {
1550 if (xmlStrEqual(att, fulln))
1557 xmlSAX2AttributeInternal(ctxt, fulln,
1558 attr->defaultValue, prefix);
1560 if ((fulln != fn) && (fulln != attr->name))
/* When `internal` is 1, repeat the work with the declaration found in
 * the external subset. */
1567 if (internal == 1) {
1568 elemDecl = xmlGetDtdQElementDesc(ctxt->myDoc->extSubset,
1571 goto process_external_subset;
1577 * xmlSAX2StartElement:
1578 * @ctx: the user data (XML parser context)
1579 * @fullname: The element name, including namespace prefix
1580 * @atts: An array of name/value attribute pairs, NULL terminated
1582 * called when an opening tag has been processed.
/*
 * Start-of-element handler taking a qualified name and a flat attribute
 * array; builds the element node in the tree.
 *
 * Visible steps, in order:
 *  - return at once if ctx, fullname or ctxt->myDoc is NULL;
 *  - when validating with no external subset and an internal subset that
 *    is missing or has no notations, elements, attributes or entities,
 *    report "Validation failed: no DTD found !" (XML_ERR_NO_DTD);
 *  - split fullname with xmlSplitQName() and create the node with a NULL
 *    namespace (resolution is deferred until the xmlns attributes have
 *    been processed);
 *  - if the document has no children yet, add the node to the document;
 *    otherwise, with no current node, use the document's first child as
 *    the parent;
 *  - record the input line when ctxt->linenumbers is set;
 *  - nodePush() the node, then link it under the parent (as a child when
 *    the parent is an element, as a sibling otherwise);
 *  - for non-HTML documents that have an internal or external subset,
 *    call xmlCheckDefaultedAttributes();
 *  - process attributes whose name begins with the five characters
 *    "xmlns", then resolve the element namespace (creating one with a
 *    NULL href and warning when a prefix stays unresolved), then process
 *    the other attributes;
 *  - when validating and vctxt.finishDtd is XML_CTXT_FINISH_DTD_0, run
 *    xmlValidateDtdFinal() and xmlValidateRoot() and move finishDtd to
 *    XML_CTXT_FINISH_DTD_1.
 *
 * NOTE(review): two loops handle "the other attributes": one forwards
 * every attribute, the other skips names beginning with "xmlns".  The
 * test choosing between them is not shown; presumably HTML mode --
 * confirm.
 * NOTE(review): this handler reports XML_ERR_NO_DTD while
 * xmlSAX2StartElementNs reports XML_DTD_NO_DTD with the same message;
 * confirm whether the difference is intended.
 */
1585 xmlSAX2StartElement(void *ctx, const xmlChar *fullname, const xmlChar **atts)
1587 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
1594 const xmlChar *value;
/* Nothing can be built without a context, an element name and a document. */
1597 if ((ctx == NULL) || (fullname == NULL) || (ctxt->myDoc == NULL)) return;
1598 parent = ctxt->node;
1600 xmlGenericError(xmlGenericErrorContext,
1601 "SAX.xmlSAX2StartElement(%s)\n", fullname);
1605 * First check on validity:
1607 if (ctxt->validate && (ctxt->myDoc->extSubset == NULL) &&
1608 ((ctxt->myDoc->intSubset == NULL) ||
1609 ((ctxt->myDoc->intSubset->notations == NULL) &&
1610 (ctxt->myDoc->intSubset->elements == NULL) &&
1611 (ctxt->myDoc->intSubset->attributes == NULL) &&
1612 (ctxt->myDoc->intSubset->entities == NULL)))) {
1613 xmlErrValid(ctxt, XML_ERR_NO_DTD,
1614 "Validation failed: no DTD found !", NULL, NULL);
1620 * Split the full name into a namespace prefix and the tag name
1622 name = xmlSplitQName(ctxt, fullname, &prefix);
1626 * Note : the namespace resolution is deferred until the end of the
1627 * attributes parsing, since local namespace can be defined as
1628 * an attribute at this level.
1630 ret = xmlNewDocNodeEatName(ctxt->myDoc, NULL, name, NULL);
1634 xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElement");
/* An empty document takes this node as its first child; otherwise, when
 * there is no current node, the document's first child acts as parent. */
1637 if (ctxt->myDoc->children == NULL) {
1638 #ifdef DEBUG_SAX_TREE
1639 xmlGenericError(xmlGenericErrorContext, "Setting %s as root\n", name);
1641 xmlAddChild((xmlNodePtr) ctxt->myDoc, (xmlNodePtr) ret);
1642 } else if (parent == NULL) {
1643 parent = ctxt->myDoc->children;
1646 if (ctxt->linenumbers) {
1647 if (ctxt->input != NULL) {
1648 if (ctxt->input->line < 65535)
1649 ret->line = (short) ctxt->input->line;
1656 * We are parsing a new node.
1658 #ifdef DEBUG_SAX_TREE
1659 xmlGenericError(xmlGenericErrorContext, "pushing(%s)\n", name);
1661 nodePush(ctxt, ret);
1664 * Link the child element
1666 if (parent != NULL) {
1667 if (parent->type == XML_ELEMENT_NODE) {
1668 #ifdef DEBUG_SAX_TREE
1669 xmlGenericError(xmlGenericErrorContext,
1670 "adding child %s to %s\n", name, parent->name);
1672 xmlAddChild(parent, ret);
1674 #ifdef DEBUG_SAX_TREE
1675 xmlGenericError(xmlGenericErrorContext,
1676 "adding sibling %s to ", name);
1677 xmlDebugDumpOneNode(stderr, parent, 0);
1679 xmlAddSibling(parent, ret);
1684 * Insert all the defaulted attributes from the DTD especially namespaces
1686 if ((!ctxt->html) &&
1687 ((ctxt->myDoc->intSubset != NULL) ||
1688 (ctxt->myDoc->extSubset != NULL))) {
1689 xmlCheckDefaultedAttributes(ctxt, name, prefix, atts);
1693 * process all the attributes whose name start with "xmlns"
1700 while ((att != NULL) && (value != NULL)) {
1701 if ((att[0] == 'x') && (att[1] == 'm') && (att[2] == 'l') &&
1702 (att[3] == 'n') && (att[4] == 's'))
1703 xmlSAX2AttributeInternal(ctxt, att, value, prefix);
1712 * Search the namespace, note that since the attributes have been
1713 * processed, the local namespaces are available.
1715 ns = xmlSearchNs(ctxt->myDoc, ret, prefix);
1716 if ((ns == NULL) && (parent != NULL))
1717 ns = xmlSearchNs(ctxt->myDoc, parent, prefix);
1718 if ((prefix != NULL) && (ns == NULL)) {
1719 ns = xmlNewNs(ret, NULL, prefix);
1720 xmlNsWarnMsg(ctxt, XML_NS_ERR_UNDEFINED_NAMESPACE,
1721 "Namespace prefix %s is not defined\n",
1726 * set the namespace node, making sure that if the default namspace
1727 * is unbound on a parent we simply kee it NULL
1729 if ((ns != NULL) && (ns->href != NULL) &&
1730 ((ns->href[0] != 0) || (ns->prefix != NULL)))
1734 * process all the other attributes
1741 while (att != NULL) {
1742 xmlSAX2AttributeInternal(ctxt, att, value, NULL);
1747 while ((att != NULL) && (value != NULL)) {
1748 if ((att[0] != 'x') || (att[1] != 'm') || (att[2] != 'l') ||
1749 (att[3] != 'n') || (att[4] != 's'))
1750 xmlSAX2AttributeInternal(ctxt, att, value, NULL);
1761 #ifdef LIBXML_VALID_ENABLED
1763 * If it's the Document root, finish the DTD validation and
1764 * check the document root element for validity
1766 if ((ctxt->validate) && (ctxt->vctxt.finishDtd == XML_CTXT_FINISH_DTD_0)) {
1769 chk = xmlValidateDtdFinal(&ctxt->vctxt, ctxt->myDoc);
1773 ctxt->wellFormed = 0;
1774 ctxt->valid &= xmlValidateRoot(&ctxt->vctxt, ctxt->myDoc);
1775 ctxt->vctxt.finishDtd = XML_CTXT_FINISH_DTD_1;
1777 #endif /* LIBXML_VALID_ENABLED */
1785 * xmlSAX2EndElement:
1786 * @ctx: the user data (XML parser context)
1787 * @name: The element name
1789 * called when the end of an element has been detected.
/*
 * End-of-element handler.
 *
 * When ctxt->record_info is set and cur is not NULL, the end offset, end
 * line and node are stored in ctxt->nodeInfo and registered with
 * xmlParserAddNodeInfo().  With LIBXML_VALID_ENABLED, when validating a
 * well-formed document that has an internal subset, the result of
 * xmlValidateOneElement() is folded into ctxt->valid.
 *
 * ctx:  parser context passed as user data; NULL makes the call a no-op
 * name: marked ATTRIBUTE_UNUSED; only referenced by trace messages
 *
 * NOTE(review): the assignment of cur is not visible here; presumably the
 * current node (ctxt->node) -- confirm.
 * NOTE(review): the "popping" trace reads cur->name without the
 * cur != NULL test that guards the node-info update; it is only compiled
 * under DEBUG_SAX_TREE.
 */
1792 xmlSAX2EndElement(void *ctx, const xmlChar *name ATTRIBUTE_UNUSED)
1794 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
1797 if (ctx == NULL) return;
1801 xmlGenericError(xmlGenericErrorContext, "SAX.xmlSAX2EndElement(NULL)\n");
1803 xmlGenericError(xmlGenericErrorContext, "SAX.xmlSAX2EndElement(%s)\n", name);
1806 /* Capture the end offset and line in ctxt->nodeInfo and register it for cur */
1807 if (cur != NULL && ctxt->record_info) {
1808 ctxt->nodeInfo->end_pos = ctxt->input->cur - ctxt->input->base;
1809 ctxt->nodeInfo->end_line = ctxt->input->line;
1810 ctxt->nodeInfo->node = cur;
1811 xmlParserAddNodeInfo(ctxt, ctxt->nodeInfo);
1815 #ifdef LIBXML_VALID_ENABLED
1816 if (ctxt->validate && ctxt->wellFormed &&
1817 ctxt->myDoc && ctxt->myDoc->intSubset)
1818 ctxt->valid &= xmlValidateOneElement(&ctxt->vctxt, ctxt->myDoc,
1820 #endif /* LIBXML_VALID_ENABLED */
1824 * end of parsing of this node.
1826 #ifdef DEBUG_SAX_TREE
1827 xmlGenericError(xmlGenericErrorContext, "popping(%s)\n", cur->name);
1831 #endif /* LIBXML_SAX1_ENABLED || LIBXML_HTML_ENABLED || LIBXML_LEGACY_ENABLED */
1835 * @ctxt: the parser context
1836 * @str: the input string
1837 * @len: the string length
1839 * Callback for a text node
1841 * Returns the newly allocated text node or NULL if not needed or error
/*
 * Build a text node holding the len bytes starting at str.
 *
 * ctxt: parser context supplying the free-node list, dictionary, options
 *       and input position
 * str:  start of the text
 * len:  number of bytes of text
 *
 * Visible steps:
 *  - take the node from ctxt->freeElems when the list is not empty,
 *    otherwise xmlMalloc() it; the node is then zeroed;
 *  - when ctxt->dictNames is set, try to avoid a heap copy:
 *      . with XML_PARSE_COMPACT and len < 2 * sizeof(void *), the bytes
 *        are copied into the node itself, starting at &ret->properties;
 *      . texts of at most 3 bytes followed by a quote, or by '<' not
 *        followed by '!', are interned with xmlDictLookup();
 *      . runs shorter than 60 bytes made only of blanks and followed by
 *        '<' not followed by '!' are interned as well;
 *  - otherwise the content is an xmlStrndup() copy;
 *  - the input line is recorded when ctxt->linenumbers is set (stored in
 *    ret->line when below 65535; with XML_PARSE_BIG_LINES the full value
 *    is stored in ret->psvi);
 *  - the node-registration callback is invoked when one is installed.
 *
 * NOTE: str[len], and in two branches str[len + 1], are read although
 * they lie after the len bytes of text; callers must pass a buffer in
 * which those bytes are readable.
 *
 * Fix: the node-allocation failure message named xmlSAX2Characters.  This
 * helper is also called from xmlSAX2AttributeNs, so the message now
 * names xmlSAX2TextNode, like the content-allocation failure below.
 */
1844 xmlSAX2TextNode(xmlParserCtxtPtr ctxt, const xmlChar *str, int len) {
1846 const xmlChar *intern = NULL;
1851 if (ctxt->freeElems != NULL) {
1852 ret = ctxt->freeElems;
1853 ctxt->freeElems = ret->next;
1854 ctxt->freeElemsNr--;
1856 ret = (xmlNodePtr) xmlMalloc(sizeof(xmlNode));
1859 xmlErrMemory(ctxt, "xmlSAX2TextNode");
1862 memset(ret, 0, sizeof(xmlNode));
1864 * intern the formatting blanks found between tags, or the
1865 * very short strings
1867 if (ctxt->dictNames) {
/* cur is the byte just past the text; it is only inspected to decide
 * whether the text is worth interning. */
1868 xmlChar cur = str[len];
1870 if ((len < (int) (2 * sizeof(void *))) &&
1871 (ctxt->options & XML_PARSE_COMPACT)) {
1872 /* store the string in the node overriding properties and nsDef */
1873 xmlChar *tmp = (xmlChar *) &(ret->properties);
1874 memcpy(tmp, str, len);
1877 } else if ((len <= 3) && ((cur == '"') || (cur == '\'') ||
1878 ((cur == '<') && (str[len + 1] != '!')))) {
1879 intern = xmlDictLookup(ctxt->dict, str, len);
1880 } else if (IS_BLANK_CH(*str) && (len < 60) && (cur == '<') &&
1881 (str[len + 1] != '!')) {
1884 for (i = 1;i < len;i++) {
1885 if (!IS_BLANK_CH(str[i])) goto skip;
1887 intern = xmlDictLookup(ctxt->dict, str, len);
1891 ret->type = XML_TEXT_NODE;
1893 ret->name = xmlStringText;
1894 if (intern == NULL) {
1895 ret->content = xmlStrndup(str, len);
1896 if (ret->content == NULL) {
1897 xmlSAX2ErrMemory(ctxt, "xmlSAX2TextNode");
1902 ret->content = (xmlChar *) intern;
1904 if (ctxt->linenumbers) {
1905 if (ctxt->input != NULL) {
1906 if (ctxt->input->line < 65535)
1907 ret->line = (short) ctxt->input->line;
1910 if (ctxt->options & XML_PARSE_BIG_LINES)
1911 ret->psvi = (void *) (long) ctxt->input->line;
1916 if ((__xmlRegisterCallbacks) && (xmlRegisterNodeDefaultValue))
1917 xmlRegisterNodeDefaultValue(ret);
1921 #ifdef LIBXML_VALID_ENABLED
1923 * xmlSAX2DecodeAttrEntities:
1924 * @ctxt: the parser context
1925 * @str: the input string
1926 * @end: pointer to the end of the input string
1928 * Remove the entities from an attribute value
1930 * Returns the newly allocated string or NULL if not needed or error
/*
 * Decode the entity references found in the attribute value delimited by
 * str and end.
 *
 * ctxt: parser context forwarded to the decoder
 * str:  start of the value
 * end:  end of the value; the length handed to the decoder is end - str
 *
 * The visible work is a single call to xmlStringLenDecodeEntities() with
 * XML_SUBSTITUTE_REF and three zero arguments; its result is stored in
 * ret.
 */
1933 xmlSAX2DecodeAttrEntities(xmlParserCtxtPtr ctxt, const xmlChar *str,
1934 const xmlChar *end) {
1945 ret = xmlStringLenDecodeEntities(ctxt, str, end - str,
1946 XML_SUBSTITUTE_REF, 0,0,0);
1950 #endif /* LIBXML_VALID_ENABLED */
1953 * xmlSAX2AttributeNs:
1954 * @ctxt: the XML parser context
1955 * @localname: the local name of the attribute
1956 * @prefix: the attribute namespace prefix if available
1957 * @URI: the attribute namespace name if available
1958 * @value: Start of the attribute value
1959 * @valueend: end of the attribute value
1961 * Handle an attribute that has been read by the parser.
1962 * The default handling is to convert the attribute into a
1963 * DOM subtree and paste it into a new xmlAttr element added to
/*
 * Build the xmlAttr for one namespace-aware attribute and attach it to
 * the current element (ctxt->node).
 *
 * ctxt:      parser context
 * localname: attribute name; stored as-is when ctxt->dictNames is set,
 *            duplicated with xmlStrdup() otherwise
 * prefix:    attribute prefix, resolved with xmlSearchNs(); per the note
 *            in the body a NULL prefix does not select the default
 *            namespace
 * value:     start of the raw attribute value
 * valueend:  end of the raw value; lengths are computed as
 *            valueend - value
 *
 * Visible steps:
 *  - obtain the attribute node from ctxt->freeAttrs when that list is
 *    not empty (zeroed, typed, linked at the end of
 *    ctxt->node->properties), otherwise from xmlNewNsPropEatName() or
 *    xmlNewNsProp();
 *  - build the children: when entities are not substituted and the
 *    document is not HTML, a single text node if *valueend is non-zero,
 *    else the node list from xmlStringLenGetNodeList(); in the other
 *    mode, a single text node when value is not NULL;
 *  - with LIBXML_VALID_ENABLED, for non-HTML, validating, well-formed
 *    documents with an internal subset, validate the attribute with
 *    xmlValidateOneAttribute(), on a decoded and possibly normalized
 *    copy (dup) when entities are not substituted;
 *  - unless XML_SKIP_IDS is set, register xml:id values and attributes
 *    for which xmlIsID()/xmlIsRef() hold via xmlAddID()/xmlAddRef().
 */
1967 xmlSAX2AttributeNs(xmlParserCtxtPtr ctxt,
1968 const xmlChar * localname,
1969 const xmlChar * prefix,
1970 const xmlChar * value,
1971 const xmlChar * valueend)
1974 xmlNsPtr namespace = NULL;
1975 xmlChar *dup = NULL;
1978 * Note: if prefix == NULL, the attribute is not in the default namespace
1981 namespace = xmlSearchNs(ctxt->myDoc, ctxt->node, prefix);
/* Reuse an xmlAttr from the context's free list when one is available;
 * the regular constructors further down are the fallback. */
1986 if (ctxt->freeAttrs != NULL) {
1987 ret = ctxt->freeAttrs;
1988 ctxt->freeAttrs = ret->next;
1989 ctxt->freeAttrsNr--;
1990 memset(ret, 0, sizeof(xmlAttr));
1991 ret->type = XML_ATTRIBUTE_NODE;
1993 ret->parent = ctxt->node;
1994 ret->doc = ctxt->myDoc;
1995 ret->ns = namespace;
1997 if (ctxt->dictNames)
1998 ret->name = localname;
2000 ret->name = xmlStrdup(localname);
2002 /* link at the end to preserve order, TODO speed up with a last */
2003 if (ctxt->node->properties == NULL) {
2004 ctxt->node->properties = ret;
2006 xmlAttrPtr prev = ctxt->node->properties;
2008 while (prev->next != NULL) prev = prev->next;
2013 if ((__xmlRegisterCallbacks) && (xmlRegisterNodeDefaultValue))
2014 xmlRegisterNodeDefaultValue((xmlNodePtr)ret);
2016 if (ctxt->dictNames)
2017 ret = xmlNewNsPropEatName(ctxt->node, namespace,
2018 (xmlChar *) localname, NULL);
2020 ret = xmlNewNsProp(ctxt->node, namespace, localname, NULL);
2022 xmlErrMemory(ctxt, "xmlSAX2AttributeNs");
2027 if ((ctxt->replaceEntities == 0) && (!ctxt->html)) {
2031 * We know that if there is an entity reference, then
2032 * the string has been dup'ed and terminates with 0
2033 * otherwise with ' or "
2035 if (*valueend != 0) {
2036 tmp = xmlSAX2TextNode(ctxt, value, valueend - value);
2037 ret->children = tmp;
2040 tmp->doc = ret->doc;
2041 tmp->parent = (xmlNodePtr) ret;
2044 ret->children = xmlStringLenGetNodeList(ctxt->myDoc, value,
2046 tmp = ret->children;
2047 while (tmp != NULL) {
2048 tmp->doc = ret->doc;
2049 tmp->parent = (xmlNodePtr) ret;
2050 if (tmp->next == NULL)
2055 } else if (value != NULL) {
2058 tmp = xmlSAX2TextNode(ctxt, value, valueend - value);
2059 ret->children = tmp;
2062 tmp->doc = ret->doc;
2063 tmp->parent = (xmlNodePtr) ret;
2067 #ifdef LIBXML_VALID_ENABLED
2068 if ((!ctxt->html) && ctxt->validate && ctxt->wellFormed &&
2069 ctxt->myDoc && ctxt->myDoc->intSubset) {
2071 * If we don't substitute entities, the validation should be
2072 * done on a value with replaced entities anyway.
2074 if (!ctxt->replaceEntities) {
2075 dup = xmlSAX2DecodeAttrEntities(ctxt, value, valueend);
2077 if (*valueend == 0) {
2078 ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt,
2079 ctxt->myDoc, ctxt->node, ret, value);
2082 * That should already be normalized.
2083 * cheaper to finally allocate here than duplicate
2084 * entry points in the full validation code
2086 dup = xmlStrndup(value, valueend - value);
2088 ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt,
2089 ctxt->myDoc, ctxt->node, ret, dup);
2093 * dup now contains a string of the flattened attribute
2094 * content with entities substitued. Check if we need to
2095 * apply an extra layer of normalization.
2096 * It need to be done twice ... it's an extra burden related
2097 * to the ability to keep references in attributes
2099 if (ctxt->attsSpecial != NULL) {
2104 fullname = xmlBuildQName(localname, prefix, fn, 50);
2105 if (fullname != NULL) {
2106 ctxt->vctxt.valid = 1;
2107 nvalnorm = xmlValidCtxtNormalizeAttributeValue(
2108 &ctxt->vctxt, ctxt->myDoc,
2109 ctxt->node, fullname, dup);
2110 if (ctxt->vctxt.valid != 1)
2113 if ((fullname != fn) && (fullname != localname))
2115 if (nvalnorm != NULL) {
2122 ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt,
2123 ctxt->myDoc, ctxt->node, ret, dup);
2127 * if entities already have been substitued, then
2128 * the attribute as passed is already normalized
2130 dup = xmlStrndup(value, valueend - value);
2132 ctxt->valid &= xmlValidateOneAttribute(&ctxt->vctxt,
2133 ctxt->myDoc, ctxt->node, ret, dup);
2136 #endif /* LIBXML_VALID_ENABLED */
/* ID / IDREF bookkeeping, skipped entirely when XML_SKIP_IDS is set. */
2137 if (((ctxt->loadsubset & XML_SKIP_IDS) == 0) &&
2138 (((ctxt->replaceEntities == 0) && (ctxt->external != 2)) ||
2139 ((ctxt->replaceEntities != 0) && (ctxt->inSubset == 0)))) {
2141 * when validating, the ID registration is done at the attribute
2142 * validation level. Otherwise we have to do specific handling here.
2144 if ((prefix == ctxt->str_xml) &&
2145 (localname[0] == 'i') && (localname[1] == 'd') &&
2146 (localname[2] == 0)) {
2148 * Add the xml:id value
2150 * Open issue: normalization of the value.
2153 dup = xmlStrndup(value, valueend - value);
2154 #if defined(LIBXML_SAX1_ENABLED) || defined(LIBXML_HTML_ENABLED) || defined(LIBXML_WRITER_ENABLED) || defined(LIBXML_DOCB_ENABLED) || defined(LIBXML_LEGACY_ENABLED)
2155 #ifdef LIBXML_VALID_ENABLED
2156 if (xmlValidateNCName(dup, 1) != 0) {
2157 xmlErrValid(ctxt, XML_DTD_XMLID_VALUE,
2158 "xml:id : attribute value %s is not an NCName\n",
2159 (const char *) dup, NULL);
2163 xmlAddID(&ctxt->vctxt, ctxt->myDoc, dup, ret);
2164 } else if (xmlIsID(ctxt->myDoc, ctxt->node, ret)) {
2165 /* might be worth duplicate entry points and not copy */
2167 dup = xmlStrndup(value, valueend - value);
2168 xmlAddID(&ctxt->vctxt, ctxt->myDoc, dup, ret);
2169 } else if (xmlIsRef(ctxt->myDoc, ctxt->node, ret)) {
2171 dup = xmlStrndup(value, valueend - value);
2172 xmlAddRef(&ctxt->vctxt, ctxt->myDoc, dup, ret);
2180 * xmlSAX2StartElementNs:
2181 * @ctx: the user data (XML parser context)
2182 * @localname: the local name of the element
2183 * @prefix: the element namespace prefix if available
2184 * @URI: the element namespace name if available
2185 * @nb_namespaces: number of namespace definitions on that node
2186 * @namespaces: pointer to the array of prefix/URI pairs namespace definitions
2187 * @nb_attributes: the number of attributes on that node
2188 * @nb_defaulted: the number of defaulted attributes.
2189 * @attributes: pointer to the array of (localname/prefix/URI/value/end)
2192 * SAX2 callback when an element start has been detected by the parser.
2193 * It provides the namespace information for the element, as well as
2194 * the new namespace declarations on the element.
/*
 * Namespace-aware start-of-element handler; builds the element node in
 * the tree.
 *
 * Visible steps, in order:
 *  - return at once if ctx is NULL;
 *  - when validating with no external subset and an internal subset that
 *    is missing or has no notations, elements, attributes or entities,
 *    report "Validation failed: no DTD found !" (XML_DTD_NO_DTD);
 *  - if prefix is set but URI is NULL (undefined prefix), name the node
 *    with the qualified name: a dictionary lookup when ctxt->dictNames
 *    is set, xmlBuildQName() otherwise;
 *  - take the node from ctxt->freeElems when that list is not empty,
 *    otherwise create it with xmlNewDocNodeEatName()/xmlNewDocNode();
 *  - record the input line when ctxt->linenumbers is set;
 *  - with no current node, add the new node to the document;
 *  - create one xmlNs per prefix/URI pair read from namespaces (two array
 *    slots per declaration), starting the ret->nsDef list with the first
 *    one, and validate each with xmlValidateOneNamespace() under the
 *    usual validation conditions;
 *  - nodePush() the node, then link it under the parent (as a child when
 *    the parent is an element, as a sibling otherwise);
 *  - leave the nb_defaulted attributes out of the count unless
 *    XML_COMPLETE_ATTRS is set in ctxt->loadsubset;
 *  - if URI is set and ret->ns is still NULL, search the parent (and the
 *    node itself for the "xml" prefix); failing that, create a namespace
 *    with a NULL href and emit a warning;
 *  - hand each attribute (five array slots per attribute) to
 *    xmlSAX2AttributeNs(), using a qualified name and a NULL prefix when
 *    slot 1 is set but slot 2 is NULL;
 *  - when validating and vctxt.finishDtd is XML_CTXT_FINISH_DTD_0, run
 *    xmlValidateDtdFinal() and xmlValidateRoot() and move finishDtd to
 *    XML_CTXT_FINISH_DTD_1.
 *
 * NOTE(review): only ctx is NULL-checked before ctxt->myDoc is
 * dereferenced in the validity test, whereas xmlSAX2StartElement also
 * returns when ctxt->myDoc is NULL -- confirm that a document always
 * exists when this handler runs.
 */
2197 xmlSAX2StartElementNs(void *ctx,
2198 const xmlChar *localname,
2199 const xmlChar *prefix,
2202 const xmlChar **namespaces,
2205 const xmlChar **attributes)
2207 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
2210 xmlNsPtr last = NULL, ns;
2211 const xmlChar *uri, *pref;
2212 xmlChar *lname = NULL;
2215 if (ctx == NULL) return;
2216 parent = ctxt->node;
2218 * First check on validity:
2220 if (ctxt->validate && (ctxt->myDoc->extSubset == NULL) &&
2221 ((ctxt->myDoc->intSubset == NULL) ||
2222 ((ctxt->myDoc->intSubset->notations == NULL) &&
2223 (ctxt->myDoc->intSubset->elements == NULL) &&
2224 (ctxt->myDoc->intSubset->attributes == NULL) &&
2225 (ctxt->myDoc->intSubset->entities == NULL)))) {
2226 xmlErrValid(ctxt, XML_DTD_NO_DTD,
2227 "Validation failed: no DTD found !", NULL, NULL);
2232 * Take care of the rare case of an undefined namespace prefix
2234 if ((prefix != NULL) && (URI == NULL)) {
2235 if (ctxt->dictNames) {
2236 const xmlChar *fullname;
2238 fullname = xmlDictQLookup(ctxt->dict, prefix, localname);
2239 if (fullname != NULL)
2240 localname = fullname;
2242 lname = xmlBuildQName(localname, prefix, NULL, 0);
2248 if (ctxt->freeElems != NULL) {
2249 ret = ctxt->freeElems;
2250 ctxt->freeElems = ret->next;
2251 ctxt->freeElemsNr--;
2252 memset(ret, 0, sizeof(xmlNode));
2253 ret->type = XML_ELEMENT_NODE;
2255 if (ctxt->dictNames)
2256 ret->name = localname;
2259 ret->name = xmlStrdup(localname);
2262 if (ret->name == NULL) {
2263 xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElementNs");
2267 if ((__xmlRegisterCallbacks) && (xmlRegisterNodeDefaultValue))
2268 xmlRegisterNodeDefaultValue(ret);
2270 if (ctxt->dictNames)
2271 ret = xmlNewDocNodeEatName(ctxt->myDoc, NULL,
2272 (xmlChar *) localname, NULL);
2273 else if (lname == NULL)
2274 ret = xmlNewDocNode(ctxt->myDoc, NULL, localname, NULL);
2276 ret = xmlNewDocNodeEatName(ctxt->myDoc, NULL,
2277 (xmlChar *) lname, NULL);
2279 xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElementNs");
2283 if (ctxt->linenumbers) {
2284 if (ctxt->input != NULL) {
2285 if (ctxt->input->line < 65535)
2286 ret->line = (short) ctxt->input->line;
2292 if (parent == NULL) {
2293 xmlAddChild((xmlNodePtr) ctxt->myDoc, (xmlNodePtr) ret);
2296 * Build the namespace list
2298 for (i = 0,j = 0;j < nb_namespaces;j++) {
2299 pref = namespaces[i++];
2300 uri = namespaces[i++];
2301 ns = xmlNewNs(NULL, uri, pref);
2304 ret->nsDef = last = ns;
2309 if ((URI != NULL) && (prefix == pref))
2313 * any out of memory error would already have been raised
2314 * but we can't be garanteed it's the actual error due to the
2315 * API, best is to skip in this case
2319 #ifdef LIBXML_VALID_ENABLED
2320 if ((!ctxt->html) && ctxt->validate && ctxt->wellFormed &&
2321 ctxt->myDoc && ctxt->myDoc->intSubset) {
2322 ctxt->valid &= xmlValidateOneNamespace(&ctxt->vctxt, ctxt->myDoc,
2323 ret, prefix, ns, uri);
2325 #endif /* LIBXML_VALID_ENABLED */
2330 * We are parsing a new node.
2332 nodePush(ctxt, ret);
2335 * Link the child element
2337 if (parent != NULL) {
2338 if (parent->type == XML_ELEMENT_NODE) {
2339 xmlAddChild(parent, ret);
2341 xmlAddSibling(parent, ret);
2346 * Insert the defaulted attributes from the DTD only if requested:
2348 if ((nb_defaulted != 0) &&
2349 ((ctxt->loadsubset & XML_COMPLETE_ATTRS) == 0))
2350 nb_attributes -= nb_defaulted;
2353 * Search the namespace if it wasn't already found
2354 * Note that, if prefix is NULL, this searches for the default Ns
2356 if ((URI != NULL) && (ret->ns == NULL)) {
2357 ret->ns = xmlSearchNs(ctxt->myDoc, parent, prefix);
2358 if ((ret->ns == NULL) && (xmlStrEqual(prefix, BAD_CAST "xml"))) {
2359 ret->ns = xmlSearchNs(ctxt->myDoc, ret, prefix);
2361 if (ret->ns == NULL) {
2362 ns = xmlNewNs(ret, NULL, prefix);
2365 xmlSAX2ErrMemory(ctxt, "xmlSAX2StartElementNs");
2369 xmlNsWarnMsg(ctxt, XML_NS_ERR_UNDEFINED_NAMESPACE,
2370 "Namespace prefix %s was not found\n",
2373 xmlNsWarnMsg(ctxt, XML_NS_ERR_UNDEFINED_NAMESPACE,
2374 "Namespace default prefix was not found\n",
2380 * process all the other attributes
2382 if (nb_attributes > 0) {
2383 for (j = 0,i = 0;i < nb_attributes;i++,j+=5) {
2385 * Handle the rare case of an undefined atribute prefix
2387 if ((attributes[j+1] != NULL) && (attributes[j+2] == NULL)) {
2388 if (ctxt->dictNames) {
2389 const xmlChar *fullname;
2391 fullname = xmlDictQLookup(ctxt->dict, attributes[j+1],
2393 if (fullname != NULL) {
2394 xmlSAX2AttributeNs(ctxt, fullname, NULL,
2395 attributes[j+3], attributes[j+4]);
2399 lname = xmlBuildQName(attributes[j], attributes[j+1],
2401 if (lname != NULL) {
2402 xmlSAX2AttributeNs(ctxt, lname, NULL,
2403 attributes[j+3], attributes[j+4]);
2409 xmlSAX2AttributeNs(ctxt, attributes[j], attributes[j+1],
2410 attributes[j+3], attributes[j+4]);
2414 #ifdef LIBXML_VALID_ENABLED
2416 * If it's the Document root, finish the DTD validation and
2417 * check the document root element for validity
2419 if ((ctxt->validate) && (ctxt->vctxt.finishDtd == XML_CTXT_FINISH_DTD_0)) {
2422 chk = xmlValidateDtdFinal(&ctxt->vctxt, ctxt->myDoc);
2426 ctxt->wellFormed = 0;
2427 ctxt->valid &= xmlValidateRoot(&ctxt->vctxt, ctxt->myDoc);
2428 ctxt->vctxt.finishDtd = XML_CTXT_FINISH_DTD_1;
2430 #endif /* LIBXML_VALID_ENABLED */
2434 * xmlSAX2EndElementNs:
2435 * @ctx: the user data (XML parser context)
2436 * @localname: the local name of the element
2437 * @prefix: the element namespace prefix if available
2438 * @URI: the element namespace name if available
2440 * SAX2 callback when an element end has been detected by the parser.
2441 * It provides the namespace information for the element.
/*
 * Namespace-aware end-of-element handler.
 *
 * When ctxt->record_info is set and cur is not NULL, a local
 * xmlParserNodeInfo is filled with the end offset, end line and node and
 * registered with xmlParserAddNodeInfo().  With LIBXML_VALID_ENABLED,
 * when validating a well-formed document that has an internal subset,
 * the result of xmlValidateOneElement() is folded into ctxt->valid.
 *
 * ctx:       parser context passed as user data; NULL makes the call a
 *            no-op
 * localname, prefix, URI: marked ATTRIBUTE_UNUSED
 *
 * Fix: node_info lives on the stack and only three of its fields were
 * assigned before it was handed to xmlParserAddNodeInfo(), so its other
 * fields carried indeterminate values.  It is now zeroed first.
 *
 * NOTE(review): the assignment of cur is not visible here; presumably the
 * current node (ctxt->node) -- confirm.
 */
2444 xmlSAX2EndElementNs(void *ctx,
2445 const xmlChar * localname ATTRIBUTE_UNUSED,
2446 const xmlChar * prefix ATTRIBUTE_UNUSED,
2447 const xmlChar * URI ATTRIBUTE_UNUSED)
2449 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
2450 xmlParserNodeInfo node_info;
2453 if (ctx == NULL) return;
2455 /* Capture end position and add node */
2456 if ((ctxt->record_info) && (cur != NULL)) {
/* Start from a fully defined record so that no indeterminate field is
 * passed on. */
memset(&node_info, 0, sizeof(node_info));
2457 node_info.end_pos = ctxt->input->cur - ctxt->input->base;
2458 node_info.end_line = ctxt->input->line;
2459 node_info.node = cur;
2460 xmlParserAddNodeInfo(ctxt, &node_info);
2464 #ifdef LIBXML_VALID_ENABLED
2465 if (ctxt->validate && ctxt->wellFormed &&
2466 ctxt->myDoc && ctxt->myDoc->intSubset)
2467 ctxt->valid &= xmlValidateOneElement(&ctxt->vctxt, ctxt->myDoc, cur);
2468 #endif /* LIBXML_VALID_ENABLED */
2471 * end of parsing of this node.
2478 * @ctx: the user data (XML parser context)
2479 * @name: The entity name
2481 * called when an entity reference is detected.
/*
 * Entity-reference handler: creates a reference node for name and tries
 * to attach it to the current node.
 *
 * ctx:  parser context passed as user data; NULL makes the call a no-op
 * name: name of the reference
 *
 * The node comes from either xmlNewCharRef() or xmlNewReference(); the
 * test choosing between them is not shown here -- presumably whether name
 * denotes a character reference, confirm.  The result of xmlAddChild() is
 * compared with NULL so that a failed insertion can be handled.
 */
2484 xmlSAX2Reference(void *ctx, const xmlChar *name)
2486 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
2489 if (ctx == NULL) return;
2491 xmlGenericError(xmlGenericErrorContext,
2492 "SAX.xmlSAX2Reference(%s)\n", name);
2495 ret = xmlNewCharRef(ctxt->myDoc, name);
2497 ret = xmlNewReference(ctxt->myDoc, name);
2498 #ifdef DEBUG_SAX_TREE
2499 xmlGenericError(xmlGenericErrorContext,
2500 "add xmlSAX2Reference %s to %s \n", name, ctxt->node->name);
2502 if (xmlAddChild(ctxt->node, ret) == NULL) {
2508 * xmlSAX2Characters:
2509 * @ctx: the user data (XML parser context)
2510 * @ch: a xmlChar string
2511 * @len: the number of xmlChar
2513 * receiving some chars from the parser.
/*
 * Character-data handler: adds len bytes starting at ch to the current
 * node (ctxt->node).
 *
 * ctx: parser context passed as user data; NULL makes the call a no-op
 * ch:  start of the character data
 * len: number of bytes
 *
 * Three cases are visible:
 *  - the current node has no last child: a text node is created with
 *    xmlSAX2TextNode() and installed as the only child; ctxt->nodelen
 *    and ctxt->nodemem are set to len and len + 1;
 *  - the last child is a text node named xmlStringText and
 *    ctxt->nodemem is non-zero: the data is appended in place, using
 *    nodelen/nodemem as the cached length and capacity of the content
 *    buffer.  Content stored inside the node (at &properties) or owned by
 *    the dictionary is first copied with xmlStrdup(); the append is
 *    refused beyond XML_MAX_TEXT_LENGTH unless XML_PARSE_HUGE is set, and
 *    when the size arithmetic could wrap;
 *  - the last child is such a text node but nodemem is 0: xmlTextConcat()
 *    is used and nodelen/nodemem are recomputed from the result;
 *  - otherwise a new text node is created and added with xmlAddChild().
 */
2516 xmlSAX2Characters(void *ctx, const xmlChar *ch, int len)
2518 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
2519 xmlNodePtr lastChild;
2521 if (ctx == NULL) return;
2523 xmlGenericError(xmlGenericErrorContext,
2524 "SAX.xmlSAX2Characters(%.30s, %d)\n", ch, len);
2527 * Handle the data if any. If there is no child
2528 * add it as content, otherwise if the last child is text,
2529 * concatenate it, else create a new node of type text.
2532 if (ctxt->node == NULL) {
2533 #ifdef DEBUG_SAX_TREE
2534 xmlGenericError(xmlGenericErrorContext,
2535 "add chars: ctxt->node == NULL !\n");
2539 lastChild = ctxt->node->last;
2540 #ifdef DEBUG_SAX_TREE
2541 xmlGenericError(xmlGenericErrorContext,
2542 "add chars to %s \n", ctxt->node->name);
2546 * Here we needed an accelerator mechanism in case of very large
2547 * elements. Use an attribute in the structure !!!
2549 if (lastChild == NULL) {
2550 lastChild = xmlSAX2TextNode(ctxt, ch, len);
2551 if (lastChild != NULL) {
2552 ctxt->node->children = lastChild;
2553 ctxt->node->last = lastChild;
2554 lastChild->parent = ctxt->node;
2555 lastChild->doc = ctxt->node->doc;
2556 ctxt->nodelen = len;
2557 ctxt->nodemem = len + 1;
2559 xmlSAX2ErrMemory(ctxt, "xmlSAX2Characters");
2563 int coalesceText = (lastChild != NULL) &&
2564 (lastChild->type == XML_TEXT_NODE) &&
2565 (lastChild->name == xmlStringText);
2566 if ((coalesceText) && (ctxt->nodemem != 0)) {
2568 * The whole point of maintaining nodelen and nodemem,
2569 * xmlTextConcat is too costly, i.e. compute length,
2570 * reallocate a new buffer, move data, append ch. Here
2571 * We try to minimaze realloc() uses and avoid copying
2572 * and recomputing length over and over.
2574 if (lastChild->content == (xmlChar *)&(lastChild->properties)) {
2575 lastChild->content = xmlStrdup(lastChild->content);
2576 lastChild->properties = NULL;
2577 } else if ((ctxt->nodemem == ctxt->nodelen + 1) &&
2578 (xmlDictOwns(ctxt->dict, lastChild->content))) {
2579 lastChild->content = xmlStrdup(lastChild->content);
2581 if (lastChild->content == NULL) {
2582 xmlSAX2ErrMemory(ctxt, "xmlSAX2Characters: xmlStrdup returned NULL");
/* Refuse to grow past XML_MAX_TEXT_LENGTH unless XML_PARSE_HUGE is set. */
2585 if (((size_t)ctxt->nodelen + (size_t)len > XML_MAX_TEXT_LENGTH) &&
2586 ((ctxt->options & XML_PARSE_HUGE) == 0)) {
2587 xmlSAX2ErrMemory(ctxt, "xmlSAX2Characters: huge text node");
/* Guard the size arithmetic used for the reallocation against wrap-around. */
2590 if ((size_t)ctxt->nodelen > SIZE_T_MAX - (size_t)len ||
2591 (size_t)ctxt->nodemem + (size_t)len > SIZE_T_MAX / 2) {
2592 xmlSAX2ErrMemory(ctxt, "xmlSAX2Characters overflow prevented");
/* Grow the buffer when the appended data plus terminator would not fit. */
2595 if (ctxt->nodelen + len >= ctxt->nodemem) {
2599 size = ctxt->nodemem + len;
2601 newbuf = (xmlChar *) xmlRealloc(lastChild->content,size);
2602 if (newbuf == NULL) {
2603 xmlSAX2ErrMemory(ctxt, "xmlSAX2Characters");
2606 ctxt->nodemem = size;
2607 lastChild->content = newbuf;
/* Append in place and keep the buffer NUL-terminated. */
2609 memcpy(&lastChild->content[ctxt->nodelen], ch, len);
2610 ctxt->nodelen += len;
2611 lastChild->content[ctxt->nodelen] = 0;
2612 } else if (coalesceText) {
2613 if (xmlTextConcat(lastChild, ch, len)) {
2614 xmlSAX2ErrMemory(ctxt, "xmlSAX2Characters");
2616 if (ctxt->node->children != NULL) {
2617 ctxt->nodelen = xmlStrlen(lastChild->content);
2618 ctxt->nodemem = ctxt->nodelen + 1;
2621 /* Mixed content, first time */
2622 lastChild = xmlSAX2TextNode(ctxt, ch, len);
2623 if (lastChild != NULL) {
2624 xmlAddChild(ctxt->node, lastChild);
2625 if (ctxt->node->children != NULL) {
2626 ctxt->nodelen = len;
2627 ctxt->nodemem = len + 1;
2635 * xmlSAX2IgnorableWhitespace:
2636 * @ctx: the user data (XML parser context)
2637 * @ch: a xmlChar string
2638 * @len: the number of xmlChar
2640 * receiving some ignorable whitespace from the parser.
2641 * UNUSED: by default the DOM building will use xmlSAX2Characters
/*
 * Handler for ignorable whitespace.
 *
 * All three parameters are marked ATTRIBUTE_UNUSED and the cast of ctx to
 * a parser context is commented out; the only visible statement is a
 * trace message printing up to 30 characters of ch and the length
 * (presumably compiled only in a debug build -- confirm).
 */
2644 xmlSAX2IgnorableWhitespace(void *ctx ATTRIBUTE_UNUSED, const xmlChar *ch ATTRIBUTE_UNUSED, int len ATTRIBUTE_UNUSED)
2646 /* xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; */
2648 xmlGenericError(xmlGenericErrorContext,
2649 "SAX.xmlSAX2IgnorableWhitespace(%.30s, %d)\n", ch, len);
2654 * xmlSAX2ProcessingInstruction:
2655 * @ctx: the user data (XML parser context)
2656 * @target: the target name
2657 * @data: the PI data
2659 * A processing instruction has been parsed.
/*
 * Processing-instruction handler: creates a PI node with xmlNewDocPI()
 * and inserts it in the tree.
 *
 * ctx:    parser context passed as user data; NULL makes the call a no-op
 * target: PI target name
 * data:   PI content
 *
 * Returns silently when the node cannot be created.  When
 * ctxt->linenumbers is set and an input exists, the input line is stored
 * in ret->line if it is below 65535.
 */
2662 xmlSAX2ProcessingInstruction(void *ctx, const xmlChar *target,
2663 const xmlChar *data)
2665 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
2669 if (ctx == NULL) return;
2670 parent = ctxt->node;
2672 xmlGenericError(xmlGenericErrorContext,
2673 "SAX.xmlSAX2ProcessingInstruction(%s, %s)\n", target, data);
2676 ret = xmlNewDocPI(ctxt->myDoc, target, data);
2677 if (ret == NULL) return;
2679 if (ctxt->linenumbers) {
2680 if (ctxt->input != NULL) {
2681 if (ctxt->input->line < 65535)
2682 ret->line = (short) ctxt->input->line;
/* While inside a DTD subset (inSubset 1 = internal, 2 = external) the PI
 * is attached to that subset. */
2687 if (ctxt->inSubset == 1) {
2688 xmlAddChild((xmlNodePtr) ctxt->myDoc->intSubset, ret);
2690 } else if (ctxt->inSubset == 2) {
2691 xmlAddChild((xmlNodePtr) ctxt->myDoc->extSubset, ret);
/* Otherwise: attach to the document when there is no current node, as a
 * child when the current node is an element, as a sibling for any other
 * node type. */
2694 if (parent == NULL) {
2695 #ifdef DEBUG_SAX_TREE
2696 xmlGenericError(xmlGenericErrorContext,
2697 "Setting PI %s as root\n", target);
2699 xmlAddChild((xmlNodePtr) ctxt->myDoc, (xmlNodePtr) ret);
2702 if (parent->type == XML_ELEMENT_NODE) {
2703 #ifdef DEBUG_SAX_TREE
2704 xmlGenericError(xmlGenericErrorContext,
2705 "adding PI %s child to %s\n", target, parent->name);
2707 xmlAddChild(parent, ret);
2709 #ifdef DEBUG_SAX_TREE
2710 xmlGenericError(xmlGenericErrorContext,
2711 "adding PI %s sibling to ", target);
2712 xmlDebugDumpOneNode(stderr, parent, 0);
2714 xmlAddSibling(parent, ret);
2720 * @ctx: the user data (XML parser context)
2721 * @value: the xmlSAX2Comment content
2723 * A xmlSAX2Comment has been parsed.
2726 xmlSAX2Comment(void *ctx, const xmlChar *value)
2728 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
2732 if (ctx == NULL) return;
2733 parent = ctxt->node;
2735 xmlGenericError(xmlGenericErrorContext, "SAX.xmlSAX2Comment(%s)\n", value);
2737 ret = xmlNewDocComment(ctxt->myDoc, value);
2738 if (ret == NULL) return;
2739 if (ctxt->linenumbers) {
2740 if (ctxt->input != NULL) {
2741 if (ctxt->input->line < 65535)
2742 ret->line = (short) ctxt->input->line;
2748 if (ctxt->inSubset == 1) {
2749 xmlAddChild((xmlNodePtr) ctxt->myDoc->intSubset, ret);
2751 } else if (ctxt->inSubset == 2) {
2752 xmlAddChild((xmlNodePtr) ctxt->myDoc->extSubset, ret);
2755 if (parent == NULL) {
2756 #ifdef DEBUG_SAX_TREE
2757 xmlGenericError(xmlGenericErrorContext,
2758 "Setting xmlSAX2Comment as root\n");
2760 xmlAddChild((xmlNodePtr) ctxt->myDoc, (xmlNodePtr) ret);
2763 if (parent->type == XML_ELEMENT_NODE) {
2764 #ifdef DEBUG_SAX_TREE
2765 xmlGenericError(xmlGenericErrorContext,
2766 "adding xmlSAX2Comment child to %s\n", parent->name);
2768 xmlAddChild(parent, ret);
2770 #ifdef DEBUG_SAX_TREE
2771 xmlGenericError(xmlGenericErrorContext,
2772 "adding xmlSAX2Comment sibling to ");
2773 xmlDebugDumpOneNode(stderr, parent, 0);
2775 xmlAddSibling(parent, ret);
2780 * xmlSAX2CDataBlock:
2781 * @ctx: the user data (XML parser context)
2782 * @value: The pcdata content
2783 * @len: the block length
2785 * called when a pcdata block has been parsed
2788 xmlSAX2CDataBlock(void *ctx, const xmlChar *value, int len)
2790 xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx;
2791 xmlNodePtr ret, lastChild;
2793 if (ctx == NULL) return;
2795 xmlGenericError(xmlGenericErrorContext,
2796 "SAX.pcdata(%.10s, %d)\n", value, len);
2798 lastChild = xmlGetLastChild(ctxt->node);
2799 #ifdef DEBUG_SAX_TREE
2800 xmlGenericError(xmlGenericErrorContext,
2801 "add chars to %s \n", ctxt->node->name);
2803 if ((lastChild != NULL) &&
2804 (lastChild->type == XML_CDATA_SECTION_NODE)) {
2805 xmlTextConcat(lastChild, value, len);
2807 ret = xmlNewCDataBlock(ctxt->myDoc, value, len);
2808 xmlAddChild(ctxt->node, ret);
/* SAX version handed to xmlSAXVersion() by the default handler set-up. */
static int xmlSAX2DefaultVersionValue = 2;

#ifdef LIBXML_SAX1_ENABLED
/**
 * xmlSAXDefaultVersion:
 * @version: the version, 1 or 2
 *
 * Set the default version of SAX used globally by the library.
 * By default, during initialization the default is set to 2.
 * Note that it is generally a better coding style to use
 * xmlSAXVersion() to set up the version explicitly for a given
 * parsing context.
 *
 * Returns the previous value in case of success and -1 in case of error.
 */
int
xmlSAXDefaultVersion(int version)
{
    int previous;

    switch (version) {
        case 1:
        case 2:
            previous = xmlSAX2DefaultVersionValue;
            xmlSAX2DefaultVersionValue = version;
            return(previous);
        default:
            /* Unknown version: leave the stored default untouched. */
            return(-1);
    }
}
#endif /* LIBXML_SAX1_ENABLED */
2841 * @hdlr: the SAX handler
2842 * @version: the version, 1 or 2
2844 * Initialize the default XML SAX handler according to the version
2846 * Returns 0 in case of success and -1 in case of error.
2849 xmlSAXVersion(xmlSAXHandler *hdlr, int version)
2851 if (hdlr == NULL) return(-1);
2853 hdlr->startElement = NULL;
2854 hdlr->endElement = NULL;
2855 hdlr->startElementNs = xmlSAX2StartElementNs;
2856 hdlr->endElementNs = xmlSAX2EndElementNs;
2857 hdlr->serror = NULL;
2858 hdlr->initialized = XML_SAX2_MAGIC;
2859 #ifdef LIBXML_SAX1_ENABLED
2860 } else if (version == 1) {
2861 hdlr->startElement = xmlSAX2StartElement;
2862 hdlr->endElement = xmlSAX2EndElement;
2863 hdlr->initialized = 1;
2864 #endif /* LIBXML_SAX1_ENABLED */
2867 hdlr->internalSubset = xmlSAX2InternalSubset;
2868 hdlr->externalSubset = xmlSAX2ExternalSubset;
2869 hdlr->isStandalone = xmlSAX2IsStandalone;
2870 hdlr->hasInternalSubset = xmlSAX2HasInternalSubset;
2871 hdlr->hasExternalSubset = xmlSAX2HasExternalSubset;
2872 hdlr->resolveEntity = xmlSAX2ResolveEntity;
2873 hdlr->getEntity = xmlSAX2GetEntity;
2874 hdlr->getParameterEntity = xmlSAX2GetParameterEntity;
2875 hdlr->entityDecl = xmlSAX2EntityDecl;
2876 hdlr->attributeDecl = xmlSAX2AttributeDecl;
2877 hdlr->elementDecl = xmlSAX2ElementDecl;
2878 hdlr->notationDecl = xmlSAX2NotationDecl;
2879 hdlr->unparsedEntityDecl = xmlSAX2UnparsedEntityDecl;
2880 hdlr->setDocumentLocator = xmlSAX2SetDocumentLocator;
2881 hdlr->startDocument = xmlSAX2StartDocument;
2882 hdlr->endDocument = xmlSAX2EndDocument;
2883 hdlr->reference = xmlSAX2Reference;
2884 hdlr->characters = xmlSAX2Characters;
2885 hdlr->cdataBlock = xmlSAX2CDataBlock;
2886 hdlr->ignorableWhitespace = xmlSAX2Characters;
2887 hdlr->processingInstruction = xmlSAX2ProcessingInstruction;
2888 hdlr->comment = xmlSAX2Comment;
2889 hdlr->warning = xmlParserWarning;
2890 hdlr->error = xmlParserError;
2891 hdlr->fatalError = xmlParserError;
2897 * xmlSAX2InitDefaultSAXHandler:
2898 * @hdlr: the SAX handler
2899 * @warning: flag if non-zero sets the handler warning procedure
2901 * Initialize the default XML SAX2 handler
2904 xmlSAX2InitDefaultSAXHandler(xmlSAXHandler *hdlr, int warning)
2906 if ((hdlr == NULL) || (hdlr->initialized != 0))
2909 xmlSAXVersion(hdlr, xmlSAX2DefaultVersionValue);
2911 hdlr->warning = NULL;
2913 hdlr->warning = xmlParserWarning;
/**
 * xmlDefaultSAXHandlerInit:
 *
 * Initialize the default SAX2 handler.
 * The global xmlDefaultSAXHandler is set up through xmlSAXVersion()
 * with version 1; without SAX1 support this function does nothing.
 */
void
xmlDefaultSAXHandlerInit(void)
{
#ifdef LIBXML_SAX1_ENABLED
    xmlSAXHandlerPtr defaultHandler = (xmlSAXHandlerPtr) &xmlDefaultSAXHandler;

    xmlSAXVersion(defaultHandler, 1);
#endif /* LIBXML_SAX1_ENABLED */
}
2929 #ifdef LIBXML_HTML_ENABLED
2932 * xmlSAX2InitHtmlDefaultSAXHandler:
2933 * @hdlr: the SAX handler
2935 * Initialize the default HTML SAX2 handler
2938 xmlSAX2InitHtmlDefaultSAXHandler(xmlSAXHandler *hdlr)
2940 if ((hdlr == NULL) || (hdlr->initialized != 0))
2943 hdlr->internalSubset = xmlSAX2InternalSubset;
2944 hdlr->externalSubset = NULL;
2945 hdlr->isStandalone = NULL;
2946 hdlr->hasInternalSubset = NULL;
2947 hdlr->hasExternalSubset = NULL;
2948 hdlr->resolveEntity = NULL;
2949 hdlr->getEntity = xmlSAX2GetEntity;
2950 hdlr->getParameterEntity = NULL;
2951 hdlr->entityDecl = NULL;
2952 hdlr->attributeDecl = NULL;
2953 hdlr->elementDecl = NULL;
2954 hdlr->notationDecl = NULL;
2955 hdlr->unparsedEntityDecl = NULL;
2956 hdlr->setDocumentLocator = xmlSAX2SetDocumentLocator;
2957 hdlr->startDocument = xmlSAX2StartDocument;
2958 hdlr->endDocument = xmlSAX2EndDocument;
2959 hdlr->startElement = xmlSAX2StartElement;
2960 hdlr->endElement = xmlSAX2EndElement;
2961 hdlr->reference = NULL;
2962 hdlr->characters = xmlSAX2Characters;
2963 hdlr->cdataBlock = xmlSAX2CDataBlock;
2964 hdlr->ignorableWhitespace = xmlSAX2IgnorableWhitespace;
2965 hdlr->processingInstruction = xmlSAX2ProcessingInstruction;
2966 hdlr->comment = xmlSAX2Comment;
2967 hdlr->warning = xmlParserWarning;
2968 hdlr->error = xmlParserError;
2969 hdlr->fatalError = xmlParserError;
2971 hdlr->initialized = 1;
2975 * htmlDefaultSAXHandlerInit:
2977 * Initialize the default SAX handler
2980 htmlDefaultSAXHandlerInit(void)
2982 xmlSAX2InitHtmlDefaultSAXHandler((xmlSAXHandlerPtr) &htmlDefaultSAXHandler);
2985 #endif /* LIBXML_HTML_ENABLED */
2987 #ifdef LIBXML_DOCB_ENABLED
2990 * xmlSAX2InitDocbDefaultSAXHandler:
2991 * @hdlr: the SAX handler
2993 * Initialize the default DocBook SAX2 handler
2996 xmlSAX2InitDocbDefaultSAXHandler(xmlSAXHandler *hdlr)
2998 if ((hdlr == NULL) || (hdlr->initialized != 0))
3001 hdlr->internalSubset = xmlSAX2InternalSubset;
3002 hdlr->externalSubset = NULL;
3003 hdlr->isStandalone = xmlSAX2IsStandalone;
3004 hdlr->hasInternalSubset = xmlSAX2HasInternalSubset;
3005 hdlr->hasExternalSubset = xmlSAX2HasExternalSubset;
3006 hdlr->resolveEntity = xmlSAX2ResolveEntity;
3007 hdlr->getEntity = xmlSAX2GetEntity;
3008 hdlr->getParameterEntity = NULL;
3009 hdlr->entityDecl = xmlSAX2EntityDecl;
3010 hdlr->attributeDecl = NULL;
3011 hdlr->elementDecl = NULL;
3012 hdlr->notationDecl = NULL;
3013 hdlr->unparsedEntityDecl = NULL;
3014 hdlr->setDocumentLocator = xmlSAX2SetDocumentLocator;
3015 hdlr->startDocument = xmlSAX2StartDocument;
3016 hdlr->endDocument = xmlSAX2EndDocument;
3017 hdlr->startElement = xmlSAX2StartElement;
3018 hdlr->endElement = xmlSAX2EndElement;
3019 hdlr->reference = xmlSAX2Reference;
3020 hdlr->characters = xmlSAX2Characters;
3021 hdlr->cdataBlock = NULL;
3022 hdlr->ignorableWhitespace = xmlSAX2IgnorableWhitespace;
3023 hdlr->processingInstruction = NULL;
3024 hdlr->comment = xmlSAX2Comment;
3025 hdlr->warning = xmlParserWarning;
3026 hdlr->error = xmlParserError;
3027 hdlr->fatalError = xmlParserError;
3029 hdlr->initialized = 1;
3033 * docbDefaultSAXHandlerInit:
3035 * Initialize the default SAX handler
3038 docbDefaultSAXHandlerInit(void)
3040 xmlSAX2InitDocbDefaultSAXHandler((xmlSAXHandlerPtr) &docbDefaultSAXHandler);
3043 #endif /* LIBXML_DOCB_ENABLED */
3045 #include "elfgcchack.h"