mirror of
				https://gitlab.gnome.org/GNOME/libxml2.git
				synced 2025-10-24 13:33:01 +03:00 
			
		
		
		
	
		
			
				
	
	
		
			15199 lines
		
	
	
		
			422 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
			
		
		
	
	
			15199 lines
		
	
	
		
			422 KiB
		
	
	
	
		
			C
		
	
	
	
	
	
| /*
 | |
|  * parser.c : an XML 1.0 parser, namespaces and validity support are mostly
 | |
|  *            implemented on top of the SAX interfaces
 | |
|  *
 | |
|  * References:
 | |
|  *   The XML specification:
 | |
|  *     http://www.w3.org/TR/REC-xml
 | |
|  *   Original 1.0 version:
 | |
|  *     http://www.w3.org/TR/1998/REC-xml-19980210
 | |
|  *   XML second edition working draft
 | |
|  *     http://www.w3.org/TR/2000/WD-xml-2e-20000814
 | |
|  *
 | |
|  * Okay this is a big file, the parser core is around 7000 lines, then it
 | |
|  * is followed by the progressive parser top routines, then the various
 | |
|  * high level APIs to call the parser and a few miscellaneous functions.
 | |
|  * A number of helper functions and deprecated ones have been moved to
 | |
|  * parserInternals.c to reduce this file size.
 | |
|  * As much as possible the functions are associated with their relative
 | |
|  * production in the XML specification. A few productions defining the
 | |
|  * different ranges of character are actually implanted either in
 | |
|  * parserInternals.h or parserInternals.c
 | |
|  * The DOM tree build is realized from the default SAX callbacks in
 | |
|  * the module SAX.c.
 | |
|  * The routines doing the validation checks are in valid.c and called either
 | |
|  * from the SAX callbacks or as standalone functions using a preparsed
 | |
|  * document.
 | |
|  *
 | |
|  * See Copyright for the status of this software.
 | |
|  *
 | |
|  * daniel@veillard.com
 | |
|  */
 | |
| 
 | |
| /* To avoid EBCDIC trouble when parsing on zOS */
 | |
| #if defined(__MVS__)
 | |
| #pragma convert("ISO8859-1")
 | |
| #endif
 | |
| 
 | |
| #define IN_LIBXML
 | |
| #include "libxml.h"
 | |
| 
 | |
| #if defined(_WIN32)
 | |
| #define XML_DIR_SEP '\\'
 | |
| #else
 | |
| #define XML_DIR_SEP '/'
 | |
| #endif
 | |
| 
 | |
| #include <stdlib.h>
 | |
| #include <limits.h>
 | |
| #include <string.h>
 | |
| #include <stdarg.h>
 | |
| #include <stddef.h>
 | |
| #include <ctype.h>
 | |
| #include <stdlib.h>
 | |
| #include <libxml/parser.h>
 | |
| #include <libxml/xmlmemory.h>
 | |
| #include <libxml/tree.h>
 | |
| #include <libxml/parserInternals.h>
 | |
| #include <libxml/valid.h>
 | |
| #include <libxml/entities.h>
 | |
| #include <libxml/xmlerror.h>
 | |
| #include <libxml/encoding.h>
 | |
| #include <libxml/xmlIO.h>
 | |
| #include <libxml/uri.h>
 | |
| #include <libxml/SAX2.h>
 | |
| #ifdef LIBXML_CATALOG_ENABLED
 | |
| #include <libxml/catalog.h>
 | |
| #endif
 | |
| 
 | |
| #include "private/buf.h"
 | |
| #include "private/dict.h"
 | |
| #include "private/entities.h"
 | |
| #include "private/error.h"
 | |
| #include "private/html.h"
 | |
| #include "private/io.h"
 | |
| #include "private/parser.h"
 | |
| 
 | |
| #define NS_INDEX_EMPTY  INT_MAX
 | |
| #define NS_INDEX_XML    (INT_MAX - 1)
 | |
| #define URI_HASH_EMPTY  0xD943A04E
 | |
| #define URI_HASH_XML    0xF0451F02
 | |
| 
 | |
| struct _xmlStartTag {
 | |
|     const xmlChar *prefix;
 | |
|     const xmlChar *URI;
 | |
|     int line;
 | |
|     int nsNr;
 | |
| };
 | |
| 
 | |
| typedef struct {
 | |
|     void *saxData;
 | |
|     unsigned prefixHashValue;
 | |
|     unsigned uriHashValue;
 | |
|     unsigned elementId;
 | |
|     int oldIndex;
 | |
| } xmlParserNsExtra;
 | |
| 
 | |
| typedef struct {
 | |
|     unsigned hashValue;
 | |
|     int index;
 | |
| } xmlParserNsBucket;
 | |
| 
 | |
| struct _xmlParserNsData {
 | |
|     xmlParserNsExtra *extra;
 | |
| 
 | |
|     unsigned hashSize;
 | |
|     unsigned hashElems;
 | |
|     xmlParserNsBucket *hash;
 | |
| 
 | |
|     unsigned elementId;
 | |
|     int defaultNsIndex;
 | |
| };
 | |
| 
 | |
| struct _xmlAttrHashBucket {
 | |
|     unsigned hashValue;
 | |
|     int index;
 | |
| };
 | |
| 
 | |
| static xmlParserCtxtPtr
 | |
| xmlCreateEntityParserCtxtInternal(xmlSAXHandlerPtr sax, void *userData,
 | |
|         const xmlChar *URL, const xmlChar *ID, const xmlChar *base,
 | |
|         xmlParserCtxtPtr pctx);
 | |
| 
 | |
| static int
 | |
| xmlParseElementStart(xmlParserCtxtPtr ctxt);
 | |
| 
 | |
| static void
 | |
| xmlParseElementEnd(xmlParserCtxtPtr ctxt);
 | |
| 
 | |
| /************************************************************************
 | |
|  *									*
 | |
|  *	Arbitrary limits set in the parser. See XML_PARSE_HUGE		*
 | |
|  *									*
 | |
|  ************************************************************************/
 | |
| 
 | |
| #define XML_PARSER_BIG_ENTITY 1000
 | |
| #define XML_PARSER_LOT_ENTITY 5000
 | |
| 
 | |
| /*
 | |
|  * Constants for protection against abusive entity expansion
 | |
|  * ("billion laughs").
 | |
|  */
 | |
| 
 | |
| /*
 | |
|  * A certain amount of entity expansion which is always allowed.
 | |
|  */
 | |
| #define XML_PARSER_ALLOWED_EXPANSION 1000000
 | |
| 
 | |
| /*
 | |
|  * Fixed cost for each entity reference. This crudely models processing time
 | |
|  * as well to protect, for example, against exponential expansion of empty
 | |
|  * or very short entities.
 | |
|  */
 | |
| #define XML_ENT_FIXED_COST 20
 | |
| 
 | |
| /**
 | |
|  * xmlParserMaxDepth:
 | |
|  *
 | |
|  * arbitrary depth limit for the XML documents that we allow to
 | |
|  * process. This is not a limitation of the parser but a safety
 | |
|  * boundary feature. It can be disabled with the XML_PARSE_HUGE
 | |
|  * parser option.
 | |
|  */
 | |
| unsigned int xmlParserMaxDepth = 256;
 | |
| 
 | |
| 
 | |
| 
 | |
| #define XML_PARSER_BIG_BUFFER_SIZE 300
 | |
| #define XML_PARSER_BUFFER_SIZE 100
 | |
| #define SAX_COMPAT_MODE BAD_CAST "SAX compatibility mode document"
 | |
| 
 | |
| /**
 | |
|  * XML_PARSER_CHUNK_SIZE
 | |
|  *
 | |
|  * When calling GROW that's the minimal amount of data
 | |
|  * the parser expected to have received. It is not a hard
 | |
|  * limit but an optimization when reading strings like Names
 | |
|  * It is not strictly needed as long as inputs available characters
 | |
|  * are followed by 0, which should be provided by the I/O level
 | |
|  */
 | |
| #define XML_PARSER_CHUNK_SIZE 100
 | |
| 
 | |
| /**
 | |
|  * xmlParserVersion:
 | |
|  *
 | |
|  * Constant string describing the internal version of the library
 | |
|  */
 | |
| const char *const
 | |
| xmlParserVersion = LIBXML_VERSION_STRING LIBXML_VERSION_EXTRA;
 | |
| 
 | |
| /*
 | |
|  * List of XML prefixed PI allowed by W3C specs
 | |
|  */
 | |
| 
 | |
| static const char* const xmlW3CPIs[] = {
 | |
|     "xml-stylesheet",
 | |
|     "xml-model",
 | |
|     NULL
 | |
| };
 | |
| 
 | |
| 
 | |
| /* DEPR void xmlParserHandleReference(xmlParserCtxtPtr ctxt); */
 | |
| static xmlEntityPtr xmlParseStringPEReference(xmlParserCtxtPtr ctxt,
 | |
|                                               const xmlChar **str);
 | |
| 
 | |
| static xmlParserErrors
 | |
| xmlParseExternalEntityPrivate(xmlDocPtr doc, xmlParserCtxtPtr oldctxt,
 | |
| 	              xmlSAXHandlerPtr sax,
 | |
| 		      void *user_data, int depth, const xmlChar *URL,
 | |
| 		      const xmlChar *ID, xmlNodePtr *list);
 | |
| 
 | |
| static int
 | |
| xmlCtxtUseOptionsInternal(xmlParserCtxtPtr ctxt, int options,
 | |
|                           const char *encoding);
 | |
| #ifdef LIBXML_LEGACY_ENABLED
 | |
| static void
 | |
| xmlAddEntityReference(xmlEntityPtr ent, xmlNodePtr firstNode,
 | |
|                       xmlNodePtr lastNode);
 | |
| #endif /* LIBXML_LEGACY_ENABLED */
 | |
| 
 | |
| static xmlParserErrors
 | |
| xmlParseBalancedChunkMemoryInternal(xmlParserCtxtPtr oldctxt,
 | |
| 		      const xmlChar *string, void *user_data, xmlNodePtr *lst);
 | |
| 
 | |
| static int
 | |
| xmlLoadEntityContent(xmlParserCtxtPtr ctxt, xmlEntityPtr entity);
 | |
| 
 | |
| /************************************************************************
 | |
|  *									*
 | |
|  *		Some factorized error routines				*
 | |
|  *									*
 | |
|  ************************************************************************/
 | |
| 
 | |
| /**
 | |
|  * xmlErrAttributeDup:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @prefix:  the attribute prefix
 | |
|  * @localname:  the attribute localname
 | |
|  *
 | |
|  * Handle a redefinition of attribute error
 | |
|  */
 | |
| static void
 | |
| xmlErrAttributeDup(xmlParserCtxtPtr ctxt, const xmlChar * prefix,
 | |
|                    const xmlChar * localname)
 | |
| {
 | |
|     if ((ctxt != NULL) && (ctxt->disableSAX != 0) &&
 | |
|         (ctxt->instate == XML_PARSER_EOF))
 | |
| 	return;
 | |
|     if (ctxt != NULL)
 | |
| 	ctxt->errNo = XML_ERR_ATTRIBUTE_REDEFINED;
 | |
| 
 | |
|     if (prefix == NULL)
 | |
|         __xmlRaiseError(NULL, NULL, NULL, ctxt, NULL, XML_FROM_PARSER,
 | |
|                         XML_ERR_ATTRIBUTE_REDEFINED, XML_ERR_FATAL, NULL, 0,
 | |
|                         (const char *) localname, NULL, NULL, 0, 0,
 | |
|                         "Attribute %s redefined\n", localname);
 | |
|     else
 | |
|         __xmlRaiseError(NULL, NULL, NULL, ctxt, NULL, XML_FROM_PARSER,
 | |
|                         XML_ERR_ATTRIBUTE_REDEFINED, XML_ERR_FATAL, NULL, 0,
 | |
|                         (const char *) prefix, (const char *) localname,
 | |
|                         NULL, 0, 0, "Attribute %s:%s redefined\n", prefix,
 | |
|                         localname);
 | |
|     if (ctxt != NULL) {
 | |
| 	ctxt->wellFormed = 0;
 | |
| 	if (ctxt->recovery == 0)
 | |
| 	    ctxt->disableSAX = 1;
 | |
|     }
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlFatalErrMsg:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @error:  the error number
 | |
|  * @msg:  the error message
 | |
|  *
 | |
|  * Handle a fatal parser error, i.e. violating Well-Formedness constraints
 | |
|  */
 | |
| static void LIBXML_ATTR_FORMAT(3,0)
 | |
| xmlFatalErrMsg(xmlParserCtxtPtr ctxt, xmlParserErrors error,
 | |
|                const char *msg)
 | |
| {
 | |
|     if ((ctxt != NULL) && (ctxt->disableSAX != 0) &&
 | |
|         (ctxt->instate == XML_PARSER_EOF))
 | |
| 	return;
 | |
|     if (ctxt != NULL)
 | |
| 	ctxt->errNo = error;
 | |
|     __xmlRaiseError(NULL, NULL, NULL, ctxt, NULL, XML_FROM_PARSER, error,
 | |
|                     XML_ERR_FATAL, NULL, 0, NULL, NULL, NULL, 0, 0, "%s", msg);
 | |
|     if (ctxt != NULL) {
 | |
| 	ctxt->wellFormed = 0;
 | |
| 	if (ctxt->recovery == 0)
 | |
| 	    ctxt->disableSAX = 1;
 | |
|     }
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlWarningMsg:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @error:  the error number
 | |
|  * @msg:  the error message
 | |
|  * @str1:  extra data
 | |
|  * @str2:  extra data
 | |
|  *
 | |
|  * Handle a warning.
 | |
|  */
 | |
| void LIBXML_ATTR_FORMAT(3,0)
 | |
| xmlWarningMsg(xmlParserCtxtPtr ctxt, xmlParserErrors error,
 | |
|               const char *msg, const xmlChar *str1, const xmlChar *str2)
 | |
| {
 | |
|     xmlStructuredErrorFunc schannel = NULL;
 | |
| 
 | |
|     if ((ctxt != NULL) && (ctxt->disableSAX != 0) &&
 | |
|         (ctxt->instate == XML_PARSER_EOF))
 | |
| 	return;
 | |
|     if ((ctxt != NULL) && (ctxt->sax != NULL) &&
 | |
|         (ctxt->sax->initialized == XML_SAX2_MAGIC))
 | |
|         schannel = ctxt->sax->serror;
 | |
|     if (ctxt != NULL) {
 | |
|         __xmlRaiseError(schannel,
 | |
|                     (ctxt->sax) ? ctxt->sax->warning : NULL,
 | |
|                     ctxt->userData,
 | |
|                     ctxt, NULL, XML_FROM_PARSER, error,
 | |
|                     XML_ERR_WARNING, NULL, 0,
 | |
| 		    (const char *) str1, (const char *) str2, NULL, 0, 0,
 | |
| 		    msg, (const char *) str1, (const char *) str2);
 | |
|     } else {
 | |
|         __xmlRaiseError(schannel, NULL, NULL,
 | |
|                     ctxt, NULL, XML_FROM_PARSER, error,
 | |
|                     XML_ERR_WARNING, NULL, 0,
 | |
| 		    (const char *) str1, (const char *) str2, NULL, 0, 0,
 | |
| 		    msg, (const char *) str1, (const char *) str2);
 | |
|     }
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlValidityError:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @error:  the error number
 | |
|  * @msg:  the error message
 | |
|  * @str1:  extra data
 | |
|  *
 | |
|  * Handle a validity error.
 | |
|  */
 | |
| static void LIBXML_ATTR_FORMAT(3,0)
 | |
| xmlValidityError(xmlParserCtxtPtr ctxt, xmlParserErrors error,
 | |
|               const char *msg, const xmlChar *str1, const xmlChar *str2)
 | |
| {
 | |
|     xmlStructuredErrorFunc schannel = NULL;
 | |
| 
 | |
|     if ((ctxt != NULL) && (ctxt->disableSAX != 0) &&
 | |
|         (ctxt->instate == XML_PARSER_EOF))
 | |
| 	return;
 | |
|     if (ctxt != NULL) {
 | |
| 	ctxt->errNo = error;
 | |
| 	if ((ctxt->sax != NULL) && (ctxt->sax->initialized == XML_SAX2_MAGIC))
 | |
| 	    schannel = ctxt->sax->serror;
 | |
|     }
 | |
|     if (ctxt != NULL) {
 | |
|         __xmlRaiseError(schannel,
 | |
|                     ctxt->vctxt.error, ctxt->vctxt.userData,
 | |
|                     ctxt, NULL, XML_FROM_DTD, error,
 | |
|                     XML_ERR_ERROR, NULL, 0, (const char *) str1,
 | |
| 		    (const char *) str2, NULL, 0, 0,
 | |
| 		    msg, (const char *) str1, (const char *) str2);
 | |
| 	ctxt->valid = 0;
 | |
|     } else {
 | |
|         __xmlRaiseError(schannel, NULL, NULL,
 | |
|                     ctxt, NULL, XML_FROM_DTD, error,
 | |
|                     XML_ERR_ERROR, NULL, 0, (const char *) str1,
 | |
| 		    (const char *) str2, NULL, 0, 0,
 | |
| 		    msg, (const char *) str1, (const char *) str2);
 | |
|     }
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlFatalErrMsgInt:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @error:  the error number
 | |
|  * @msg:  the error message
 | |
|  * @val:  an integer value
 | |
|  *
 | |
|  * Handle a fatal parser error, i.e. violating Well-Formedness constraints
 | |
|  */
 | |
| static void LIBXML_ATTR_FORMAT(3,0)
 | |
| xmlFatalErrMsgInt(xmlParserCtxtPtr ctxt, xmlParserErrors error,
 | |
|                   const char *msg, int val)
 | |
| {
 | |
|     if ((ctxt != NULL) && (ctxt->disableSAX != 0) &&
 | |
|         (ctxt->instate == XML_PARSER_EOF))
 | |
| 	return;
 | |
|     if (ctxt != NULL)
 | |
| 	ctxt->errNo = error;
 | |
|     __xmlRaiseError(NULL, NULL, NULL,
 | |
|                     ctxt, NULL, XML_FROM_PARSER, error, XML_ERR_FATAL,
 | |
|                     NULL, 0, NULL, NULL, NULL, val, 0, msg, val);
 | |
|     if (ctxt != NULL) {
 | |
| 	ctxt->wellFormed = 0;
 | |
| 	if (ctxt->recovery == 0)
 | |
| 	    ctxt->disableSAX = 1;
 | |
|     }
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlFatalErrMsgStrIntStr:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @error:  the error number
 | |
|  * @msg:  the error message
 | |
|  * @str1:  an string info
 | |
|  * @val:  an integer value
 | |
|  * @str2:  an string info
 | |
|  *
 | |
|  * Handle a fatal parser error, i.e. violating Well-Formedness constraints
 | |
|  */
 | |
| static void LIBXML_ATTR_FORMAT(3,0)
 | |
| xmlFatalErrMsgStrIntStr(xmlParserCtxtPtr ctxt, xmlParserErrors error,
 | |
|                   const char *msg, const xmlChar *str1, int val,
 | |
| 		  const xmlChar *str2)
 | |
| {
 | |
|     if ((ctxt != NULL) && (ctxt->disableSAX != 0) &&
 | |
|         (ctxt->instate == XML_PARSER_EOF))
 | |
| 	return;
 | |
|     if (ctxt != NULL)
 | |
| 	ctxt->errNo = error;
 | |
|     __xmlRaiseError(NULL, NULL, NULL,
 | |
|                     ctxt, NULL, XML_FROM_PARSER, error, XML_ERR_FATAL,
 | |
|                     NULL, 0, (const char *) str1, (const char *) str2,
 | |
| 		    NULL, val, 0, msg, str1, val, str2);
 | |
|     if (ctxt != NULL) {
 | |
| 	ctxt->wellFormed = 0;
 | |
| 	if (ctxt->recovery == 0)
 | |
| 	    ctxt->disableSAX = 1;
 | |
|     }
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlFatalErrMsgStr:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @error:  the error number
 | |
|  * @msg:  the error message
 | |
|  * @val:  a string value
 | |
|  *
 | |
|  * Handle a fatal parser error, i.e. violating Well-Formedness constraints
 | |
|  */
 | |
| static void LIBXML_ATTR_FORMAT(3,0)
 | |
| xmlFatalErrMsgStr(xmlParserCtxtPtr ctxt, xmlParserErrors error,
 | |
|                   const char *msg, const xmlChar * val)
 | |
| {
 | |
|     if ((ctxt != NULL) && (ctxt->disableSAX != 0) &&
 | |
|         (ctxt->instate == XML_PARSER_EOF))
 | |
| 	return;
 | |
|     if (ctxt != NULL)
 | |
| 	ctxt->errNo = error;
 | |
|     __xmlRaiseError(NULL, NULL, NULL, ctxt, NULL,
 | |
|                     XML_FROM_PARSER, error, XML_ERR_FATAL,
 | |
|                     NULL, 0, (const char *) val, NULL, NULL, 0, 0, msg,
 | |
|                     val);
 | |
|     if (ctxt != NULL) {
 | |
| 	ctxt->wellFormed = 0;
 | |
| 	if (ctxt->recovery == 0)
 | |
| 	    ctxt->disableSAX = 1;
 | |
|     }
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlErrMsgStr:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @error:  the error number
 | |
|  * @msg:  the error message
 | |
|  * @val:  a string value
 | |
|  *
 | |
|  * Handle a non fatal parser error
 | |
|  */
 | |
| static void LIBXML_ATTR_FORMAT(3,0)
 | |
| xmlErrMsgStr(xmlParserCtxtPtr ctxt, xmlParserErrors error,
 | |
|                   const char *msg, const xmlChar * val)
 | |
| {
 | |
|     if ((ctxt != NULL) && (ctxt->disableSAX != 0) &&
 | |
|         (ctxt->instate == XML_PARSER_EOF))
 | |
| 	return;
 | |
|     if (ctxt != NULL)
 | |
| 	ctxt->errNo = error;
 | |
|     __xmlRaiseError(NULL, NULL, NULL, ctxt, NULL,
 | |
|                     XML_FROM_PARSER, error, XML_ERR_ERROR,
 | |
|                     NULL, 0, (const char *) val, NULL, NULL, 0, 0, msg,
 | |
|                     val);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlNsErr:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @error:  the error number
 | |
|  * @msg:  the message
 | |
|  * @info1:  extra information string
 | |
|  * @info2:  extra information string
 | |
|  *
 | |
|  * Handle a fatal parser error, i.e. violating Well-Formedness constraints
 | |
|  */
 | |
| static void LIBXML_ATTR_FORMAT(3,0)
 | |
| xmlNsErr(xmlParserCtxtPtr ctxt, xmlParserErrors error,
 | |
|          const char *msg,
 | |
|          const xmlChar * info1, const xmlChar * info2,
 | |
|          const xmlChar * info3)
 | |
| {
 | |
|     if ((ctxt != NULL) && (ctxt->disableSAX != 0) &&
 | |
|         (ctxt->instate == XML_PARSER_EOF))
 | |
| 	return;
 | |
|     if (ctxt != NULL)
 | |
| 	ctxt->errNo = error;
 | |
|     __xmlRaiseError(NULL, NULL, NULL, ctxt, NULL, XML_FROM_NAMESPACE, error,
 | |
|                     XML_ERR_ERROR, NULL, 0, (const char *) info1,
 | |
|                     (const char *) info2, (const char *) info3, 0, 0, msg,
 | |
|                     info1, info2, info3);
 | |
|     if (ctxt != NULL)
 | |
| 	ctxt->nsWellFormed = 0;
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlNsWarn
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @error:  the error number
 | |
|  * @msg:  the message
 | |
|  * @info1:  extra information string
 | |
|  * @info2:  extra information string
 | |
|  *
 | |
|  * Handle a namespace warning error
 | |
|  */
 | |
| static void LIBXML_ATTR_FORMAT(3,0)
 | |
| xmlNsWarn(xmlParserCtxtPtr ctxt, xmlParserErrors error,
 | |
|          const char *msg,
 | |
|          const xmlChar * info1, const xmlChar * info2,
 | |
|          const xmlChar * info3)
 | |
| {
 | |
|     if ((ctxt != NULL) && (ctxt->disableSAX != 0) &&
 | |
|         (ctxt->instate == XML_PARSER_EOF))
 | |
| 	return;
 | |
|     __xmlRaiseError(NULL, NULL, NULL, ctxt, NULL, XML_FROM_NAMESPACE, error,
 | |
|                     XML_ERR_WARNING, NULL, 0, (const char *) info1,
 | |
|                     (const char *) info2, (const char *) info3, 0, 0, msg,
 | |
|                     info1, info2, info3);
 | |
| }
 | |
| 
 | |
| static void
 | |
| xmlSaturatedAdd(unsigned long *dst, unsigned long val) {
 | |
|     if (val > ULONG_MAX - *dst)
 | |
|         *dst = ULONG_MAX;
 | |
|     else
 | |
|         *dst += val;
 | |
| }
 | |
| 
 | |
| static void
 | |
| xmlSaturatedAddSizeT(unsigned long *dst, unsigned long val) {
 | |
|     if (val > ULONG_MAX - *dst)
 | |
|         *dst = ULONG_MAX;
 | |
|     else
 | |
|         *dst += val;
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParserEntityCheck:
 | |
|  * @ctxt:  parser context
 | |
|  * @extra:  sum of unexpanded entity sizes
 | |
|  *
 | |
|  * Check for non-linear entity expansion behaviour.
 | |
|  *
 | |
|  * In some cases like xmlStringDecodeEntities, this function is called
 | |
|  * for each, possibly nested entity and its unexpanded content length.
 | |
|  *
 | |
|  * In other cases like xmlParseReference, it's only called for each
 | |
|  * top-level entity with its unexpanded content length plus the sum of
 | |
|  * the unexpanded content lengths (plus fixed cost) of all nested
 | |
|  * entities.
 | |
|  *
 | |
|  * Summing the unexpanded lengths also adds the length of the reference.
 | |
|  * This is by design. Taking the length of the entity name into account
 | |
|  * discourages attacks that try to waste CPU time with abusively long
 | |
|  * entity names. See test/recurse/lol6.xml for example. Each call also
 | |
|  * adds some fixed cost XML_ENT_FIXED_COST to discourage attacks with
 | |
|  * short entities.
 | |
|  *
 | |
|  * Returns 1 on error, 0 on success.
 | |
|  */
 | |
| static int
 | |
| xmlParserEntityCheck(xmlParserCtxtPtr ctxt, unsigned long extra)
 | |
| {
 | |
|     unsigned long consumed;
 | |
|     xmlParserInputPtr input = ctxt->input;
 | |
|     xmlEntityPtr entity = input->entity;
 | |
| 
 | |
|     /*
 | |
|      * Compute total consumed bytes so far, including input streams of
 | |
|      * external entities.
 | |
|      */
 | |
|     consumed = input->parentConsumed;
 | |
|     if ((entity == NULL) ||
 | |
|         ((entity->etype == XML_EXTERNAL_PARAMETER_ENTITY) &&
 | |
|          ((entity->flags & XML_ENT_PARSED) == 0))) {
 | |
|         xmlSaturatedAdd(&consumed, input->consumed);
 | |
|         xmlSaturatedAddSizeT(&consumed, input->cur - input->base);
 | |
|     }
 | |
|     xmlSaturatedAdd(&consumed, ctxt->sizeentities);
 | |
| 
 | |
|     /*
 | |
|      * Add extra cost and some fixed cost.
 | |
|      */
 | |
|     xmlSaturatedAdd(&ctxt->sizeentcopy, extra);
 | |
|     xmlSaturatedAdd(&ctxt->sizeentcopy, XML_ENT_FIXED_COST);
 | |
| 
 | |
|     /*
 | |
|      * It's important to always use saturation arithmetic when tracking
 | |
|      * entity sizes to make the size checks reliable. If "sizeentcopy"
 | |
|      * overflows, we have to abort.
 | |
|      */
 | |
|     if ((ctxt->sizeentcopy > XML_PARSER_ALLOWED_EXPANSION) &&
 | |
|         ((ctxt->sizeentcopy >= ULONG_MAX) ||
 | |
|          (ctxt->sizeentcopy / ctxt->maxAmpl > consumed))) {
 | |
|         xmlFatalErrMsg(ctxt, XML_ERR_ENTITY_LOOP,
 | |
|                        "Maximum entity amplification factor exceeded, see "
 | |
|                        "xmlCtxtSetMaxAmplification.\n");
 | |
|         xmlHaltParser(ctxt);
 | |
|         return(1);
 | |
|     }
 | |
| 
 | |
|     return(0);
 | |
| }
 | |
| 
 | |
| /************************************************************************
 | |
|  *									*
 | |
|  *		Library wide options					*
 | |
|  *									*
 | |
|  ************************************************************************/
 | |
| 
 | |
| /**
 | |
|   * xmlHasFeature:
 | |
|   * @feature: the feature to be examined
 | |
|   *
 | |
|   * Examines if the library has been compiled with a given feature.
 | |
|   *
 | |
|   * Returns a non-zero value if the feature exist, otherwise zero.
 | |
|   * Returns zero (0) if the feature does not exist or an unknown
 | |
|   * unknown feature is requested, non-zero otherwise.
 | |
|   */
 | |
| int
 | |
| xmlHasFeature(xmlFeature feature)
 | |
| {
 | |
|     switch (feature) {
 | |
| 	case XML_WITH_THREAD:
 | |
| #ifdef LIBXML_THREAD_ENABLED
 | |
| 	    return(1);
 | |
| #else
 | |
| 	    return(0);
 | |
| #endif
 | |
|         case XML_WITH_TREE:
 | |
| #ifdef LIBXML_TREE_ENABLED
 | |
|             return(1);
 | |
| #else
 | |
|             return(0);
 | |
| #endif
 | |
|         case XML_WITH_OUTPUT:
 | |
| #ifdef LIBXML_OUTPUT_ENABLED
 | |
|             return(1);
 | |
| #else
 | |
|             return(0);
 | |
| #endif
 | |
|         case XML_WITH_PUSH:
 | |
| #ifdef LIBXML_PUSH_ENABLED
 | |
|             return(1);
 | |
| #else
 | |
|             return(0);
 | |
| #endif
 | |
|         case XML_WITH_READER:
 | |
| #ifdef LIBXML_READER_ENABLED
 | |
|             return(1);
 | |
| #else
 | |
|             return(0);
 | |
| #endif
 | |
|         case XML_WITH_PATTERN:
 | |
| #ifdef LIBXML_PATTERN_ENABLED
 | |
|             return(1);
 | |
| #else
 | |
|             return(0);
 | |
| #endif
 | |
|         case XML_WITH_WRITER:
 | |
| #ifdef LIBXML_WRITER_ENABLED
 | |
|             return(1);
 | |
| #else
 | |
|             return(0);
 | |
| #endif
 | |
|         case XML_WITH_SAX1:
 | |
| #ifdef LIBXML_SAX1_ENABLED
 | |
|             return(1);
 | |
| #else
 | |
|             return(0);
 | |
| #endif
 | |
|         case XML_WITH_FTP:
 | |
| #ifdef LIBXML_FTP_ENABLED
 | |
|             return(1);
 | |
| #else
 | |
|             return(0);
 | |
| #endif
 | |
|         case XML_WITH_HTTP:
 | |
| #ifdef LIBXML_HTTP_ENABLED
 | |
|             return(1);
 | |
| #else
 | |
|             return(0);
 | |
| #endif
 | |
|         case XML_WITH_VALID:
 | |
| #ifdef LIBXML_VALID_ENABLED
 | |
|             return(1);
 | |
| #else
 | |
|             return(0);
 | |
| #endif
 | |
|         case XML_WITH_HTML:
 | |
| #ifdef LIBXML_HTML_ENABLED
 | |
|             return(1);
 | |
| #else
 | |
|             return(0);
 | |
| #endif
 | |
|         case XML_WITH_LEGACY:
 | |
| #ifdef LIBXML_LEGACY_ENABLED
 | |
|             return(1);
 | |
| #else
 | |
|             return(0);
 | |
| #endif
 | |
|         case XML_WITH_C14N:
 | |
| #ifdef LIBXML_C14N_ENABLED
 | |
|             return(1);
 | |
| #else
 | |
|             return(0);
 | |
| #endif
 | |
|         case XML_WITH_CATALOG:
 | |
| #ifdef LIBXML_CATALOG_ENABLED
 | |
|             return(1);
 | |
| #else
 | |
|             return(0);
 | |
| #endif
 | |
|         case XML_WITH_XPATH:
 | |
| #ifdef LIBXML_XPATH_ENABLED
 | |
|             return(1);
 | |
| #else
 | |
|             return(0);
 | |
| #endif
 | |
|         case XML_WITH_XPTR:
 | |
| #ifdef LIBXML_XPTR_ENABLED
 | |
|             return(1);
 | |
| #else
 | |
|             return(0);
 | |
| #endif
 | |
|         case XML_WITH_XINCLUDE:
 | |
| #ifdef LIBXML_XINCLUDE_ENABLED
 | |
|             return(1);
 | |
| #else
 | |
|             return(0);
 | |
| #endif
 | |
|         case XML_WITH_ICONV:
 | |
| #ifdef LIBXML_ICONV_ENABLED
 | |
|             return(1);
 | |
| #else
 | |
|             return(0);
 | |
| #endif
 | |
|         case XML_WITH_ISO8859X:
 | |
| #ifdef LIBXML_ISO8859X_ENABLED
 | |
|             return(1);
 | |
| #else
 | |
|             return(0);
 | |
| #endif
 | |
|         case XML_WITH_UNICODE:
 | |
| #ifdef LIBXML_UNICODE_ENABLED
 | |
|             return(1);
 | |
| #else
 | |
|             return(0);
 | |
| #endif
 | |
|         case XML_WITH_REGEXP:
 | |
| #ifdef LIBXML_REGEXP_ENABLED
 | |
|             return(1);
 | |
| #else
 | |
|             return(0);
 | |
| #endif
 | |
|         case XML_WITH_AUTOMATA:
 | |
| #ifdef LIBXML_AUTOMATA_ENABLED
 | |
|             return(1);
 | |
| #else
 | |
|             return(0);
 | |
| #endif
 | |
|         case XML_WITH_EXPR:
 | |
| #ifdef LIBXML_EXPR_ENABLED
 | |
|             return(1);
 | |
| #else
 | |
|             return(0);
 | |
| #endif
 | |
|         case XML_WITH_SCHEMAS:
 | |
| #ifdef LIBXML_SCHEMAS_ENABLED
 | |
|             return(1);
 | |
| #else
 | |
|             return(0);
 | |
| #endif
 | |
|         case XML_WITH_SCHEMATRON:
 | |
| #ifdef LIBXML_SCHEMATRON_ENABLED
 | |
|             return(1);
 | |
| #else
 | |
|             return(0);
 | |
| #endif
 | |
|         case XML_WITH_MODULES:
 | |
| #ifdef LIBXML_MODULES_ENABLED
 | |
|             return(1);
 | |
| #else
 | |
|             return(0);
 | |
| #endif
 | |
|         case XML_WITH_DEBUG:
 | |
| #ifdef LIBXML_DEBUG_ENABLED
 | |
|             return(1);
 | |
| #else
 | |
|             return(0);
 | |
| #endif
 | |
|         case XML_WITH_DEBUG_MEM:
 | |
| #ifdef DEBUG_MEMORY_LOCATION
 | |
|             return(1);
 | |
| #else
 | |
|             return(0);
 | |
| #endif
 | |
|         case XML_WITH_DEBUG_RUN:
 | |
|             return(0);
 | |
|         case XML_WITH_ZLIB:
 | |
| #ifdef LIBXML_ZLIB_ENABLED
 | |
|             return(1);
 | |
| #else
 | |
|             return(0);
 | |
| #endif
 | |
|         case XML_WITH_LZMA:
 | |
| #ifdef LIBXML_LZMA_ENABLED
 | |
|             return(1);
 | |
| #else
 | |
|             return(0);
 | |
| #endif
 | |
|         case XML_WITH_ICU:
 | |
| #ifdef LIBXML_ICU_ENABLED
 | |
|             return(1);
 | |
| #else
 | |
|             return(0);
 | |
| #endif
 | |
|         default:
 | |
| 	    break;
 | |
|      }
 | |
|      return(0);
 | |
| }
 | |
| 
 | |
| /************************************************************************
 | |
|  *									*
 | |
|  *		SAX2 defaulted attributes handling			*
 | |
|  *									*
 | |
|  ************************************************************************/
 | |
| 
 | |
| /**
 | |
|  * xmlDetectSAX2:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * Do the SAX2 detection and specific initialization
 | |
|  */
 | |
| static void
 | |
| xmlDetectSAX2(xmlParserCtxtPtr ctxt) {
 | |
|     xmlSAXHandlerPtr sax;
 | |
| 
 | |
|     /* Avoid unused variable warning if features are disabled. */
 | |
|     (void) sax;
 | |
| 
 | |
|     if (ctxt == NULL) return;
 | |
|     sax = ctxt->sax;
 | |
| #ifdef LIBXML_SAX1_ENABLED
 | |
|     if ((sax) && (sax->initialized == XML_SAX2_MAGIC))
 | |
|         ctxt->sax2 = 1;
 | |
| #else
 | |
|     ctxt->sax2 = 1;
 | |
| #endif /* LIBXML_SAX1_ENABLED */
 | |
| 
 | |
|     ctxt->str_xml = xmlDictLookup(ctxt->dict, BAD_CAST "xml", 3);
 | |
|     ctxt->str_xmlns = xmlDictLookup(ctxt->dict, BAD_CAST "xmlns", 5);
 | |
|     ctxt->str_xml_ns = xmlDictLookup(ctxt->dict, XML_XML_NAMESPACE, 36);
 | |
|     if ((ctxt->str_xml==NULL) || (ctxt->str_xmlns==NULL) ||
 | |
| 		(ctxt->str_xml_ns == NULL)) {
 | |
|         xmlErrMemory(ctxt, NULL);
 | |
|     }
 | |
| }
 | |
| 
 | |
| typedef struct {
 | |
|     xmlHashedString prefix;
 | |
|     xmlHashedString name;
 | |
|     xmlHashedString value;
 | |
|     const xmlChar *valueEnd;
 | |
|     int external;
 | |
|     int expandedSize;
 | |
| } xmlDefAttr;
 | |
| 
 | |
| typedef struct _xmlDefAttrs xmlDefAttrs;
 | |
| typedef xmlDefAttrs *xmlDefAttrsPtr;
 | |
| struct _xmlDefAttrs {
 | |
|     int nbAttrs;	/* number of defaulted attributes on that element */
 | |
|     int maxAttrs;       /* the size of the array */
 | |
| #if __STDC_VERSION__ >= 199901L
 | |
|     /* Using a C99 flexible array member avoids UBSan errors. */
 | |
|     xmlDefAttr attrs[]; /* array of localname/prefix/values/external */
 | |
| #else
 | |
|     xmlDefAttr attrs[1];
 | |
| #endif
 | |
| };
 | |
| 
 | |
| /**
 | |
|  * xmlAttrNormalizeSpace:
 | |
|  * @src: the source string
 | |
|  * @dst: the target string
 | |
|  *
 | |
|  * Normalize the space in non CDATA attribute values:
 | |
|  * If the attribute type is not CDATA, then the XML processor MUST further
 | |
|  * process the normalized attribute value by discarding any leading and
 | |
|  * trailing space (#x20) characters, and by replacing sequences of space
 | |
|  * (#x20) characters by a single space (#x20) character.
 | |
|  * Note that the size of dst need to be at least src, and if one doesn't need
 | |
|  * to preserve dst (and it doesn't come from a dictionary or read-only) then
 | |
|  * passing src as dst is just fine.
 | |
|  *
 | |
|  * Returns a pointer to the normalized value (dst) or NULL if no conversion
 | |
|  *         is needed.
 | |
|  */
 | |
| static xmlChar *
 | |
| xmlAttrNormalizeSpace(const xmlChar *src, xmlChar *dst)
 | |
| {
 | |
|     if ((src == NULL) || (dst == NULL))
 | |
|         return(NULL);
 | |
| 
 | |
|     while (*src == 0x20) src++;
 | |
|     while (*src != 0) {
 | |
| 	if (*src == 0x20) {
 | |
| 	    while (*src == 0x20) src++;
 | |
| 	    if (*src != 0)
 | |
| 		*dst++ = 0x20;
 | |
| 	} else {
 | |
| 	    *dst++ = *src++;
 | |
| 	}
 | |
|     }
 | |
|     *dst = 0;
 | |
|     if (dst == src)
 | |
|        return(NULL);
 | |
|     return(dst);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlAttrNormalizeSpace2:
 | |
|  * @src: the source string
 | |
|  *
 | |
|  * Normalize the space in non CDATA attribute values, a slightly more complex
 | |
|  * front end to avoid allocation problems when running on attribute values
 | |
|  * coming from the input.
 | |
|  *
 | |
|  * Returns a pointer to the normalized value (dst) or NULL if no conversion
 | |
|  *         is needed.
 | |
|  */
 | |
| static const xmlChar *
 | |
| xmlAttrNormalizeSpace2(xmlParserCtxtPtr ctxt, xmlChar *src, int *len)
 | |
| {
 | |
|     int i;
 | |
|     int remove_head = 0;
 | |
|     int need_realloc = 0;
 | |
|     const xmlChar *cur;
 | |
| 
 | |
|     if ((ctxt == NULL) || (src == NULL) || (len == NULL))
 | |
|         return(NULL);
 | |
|     i = *len;
 | |
|     if (i <= 0)
 | |
|         return(NULL);
 | |
| 
 | |
|     cur = src;
 | |
|     while (*cur == 0x20) {
 | |
|         cur++;
 | |
| 	remove_head++;
 | |
|     }
 | |
|     while (*cur != 0) {
 | |
| 	if (*cur == 0x20) {
 | |
| 	    cur++;
 | |
| 	    if ((*cur == 0x20) || (*cur == 0)) {
 | |
| 	        need_realloc = 1;
 | |
| 		break;
 | |
| 	    }
 | |
| 	} else
 | |
| 	    cur++;
 | |
|     }
 | |
|     if (need_realloc) {
 | |
|         xmlChar *ret;
 | |
| 
 | |
| 	ret = xmlStrndup(src + remove_head, i - remove_head + 1);
 | |
| 	if (ret == NULL) {
 | |
| 	    xmlErrMemory(ctxt, NULL);
 | |
| 	    return(NULL);
 | |
| 	}
 | |
| 	xmlAttrNormalizeSpace(ret, ret);
 | |
| 	*len = strlen((const char *)ret);
 | |
|         return(ret);
 | |
|     } else if (remove_head) {
 | |
|         *len -= remove_head;
 | |
|         memmove(src, src + remove_head, 1 + *len);
 | |
| 	return(src);
 | |
|     }
 | |
|     return(NULL);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlAddDefAttrs:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @fullname:  the element fullname
 | |
|  * @fullattr:  the attribute fullname
 | |
|  * @value:  the attribute value
 | |
|  *
 | |
|  * Add a defaulted attribute for an element
 | |
|  */
 | |
| static void
 | |
| xmlAddDefAttrs(xmlParserCtxtPtr ctxt,
 | |
|                const xmlChar *fullname,
 | |
|                const xmlChar *fullattr,
 | |
|                const xmlChar *value) {
 | |
|     xmlDefAttrsPtr defaults;
 | |
|     xmlDefAttr *attr;
 | |
|     int len, expandedSize;
 | |
|     xmlHashedString name;
 | |
|     xmlHashedString prefix;
 | |
|     xmlHashedString hvalue;
 | |
|     const xmlChar *localname;
 | |
| 
 | |
|     /*
 | |
|      * Allows to detect attribute redefinitions
 | |
|      */
 | |
|     if (ctxt->attsSpecial != NULL) {
 | |
|         if (xmlHashLookup2(ctxt->attsSpecial, fullname, fullattr) != NULL)
 | |
| 	    return;
 | |
|     }
 | |
| 
 | |
|     if (ctxt->attsDefault == NULL) {
 | |
|         ctxt->attsDefault = xmlHashCreateDict(10, ctxt->dict);
 | |
| 	if (ctxt->attsDefault == NULL)
 | |
| 	    goto mem_error;
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * split the element name into prefix:localname , the string found
 | |
|      * are within the DTD and then not associated to namespace names.
 | |
|      */
 | |
|     localname = xmlSplitQName3(fullname, &len);
 | |
|     if (localname == NULL) {
 | |
|         name = xmlDictLookupHashed(ctxt->dict, fullname, -1);
 | |
| 	prefix.name = NULL;
 | |
|     } else {
 | |
|         name = xmlDictLookupHashed(ctxt->dict, localname, -1);
 | |
| 	prefix = xmlDictLookupHashed(ctxt->dict, fullname, len);
 | |
|         if (prefix.name == NULL)
 | |
|             goto mem_error;
 | |
|     }
 | |
|     if (name.name == NULL)
 | |
|         goto mem_error;
 | |
| 
 | |
|     /*
 | |
|      * make sure there is some storage
 | |
|      */
 | |
|     defaults = xmlHashLookup2(ctxt->attsDefault, name.name, prefix.name);
 | |
|     if ((defaults == NULL) ||
 | |
|         (defaults->nbAttrs >= defaults->maxAttrs)) {
 | |
|         xmlDefAttrsPtr temp;
 | |
|         int newSize;
 | |
| 
 | |
|         newSize = (defaults != NULL) ? 2 * defaults->maxAttrs : 4;
 | |
|         temp = xmlRealloc(defaults,
 | |
|                           sizeof(*defaults) + newSize * sizeof(xmlDefAttr));
 | |
| 	if (temp == NULL)
 | |
| 	    goto mem_error;
 | |
|         if (defaults == NULL)
 | |
|             temp->nbAttrs = 0;
 | |
| 	temp->maxAttrs = newSize;
 | |
|         defaults = temp;
 | |
| 	if (xmlHashUpdateEntry2(ctxt->attsDefault, name.name, prefix.name,
 | |
| 	                        defaults, NULL) < 0) {
 | |
| 	    xmlFree(defaults);
 | |
| 	    goto mem_error;
 | |
| 	}
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * Split the attribute name into prefix:localname , the string found
 | |
|      * are within the DTD and hen not associated to namespace names.
 | |
|      */
 | |
|     localname = xmlSplitQName3(fullattr, &len);
 | |
|     if (localname == NULL) {
 | |
|         name = xmlDictLookupHashed(ctxt->dict, fullattr, -1);
 | |
| 	prefix.name = NULL;
 | |
|     } else {
 | |
|         name = xmlDictLookupHashed(ctxt->dict, localname, -1);
 | |
| 	prefix = xmlDictLookupHashed(ctxt->dict, fullattr, len);
 | |
|         if (prefix.name == NULL)
 | |
|             goto mem_error;
 | |
|     }
 | |
|     if (name.name == NULL)
 | |
|         goto mem_error;
 | |
| 
 | |
|     /* intern the string and precompute the end */
 | |
|     len = strlen((const char *) value);
 | |
|     hvalue = xmlDictLookupHashed(ctxt->dict, value, len);
 | |
|     if (hvalue.name == NULL)
 | |
|         goto mem_error;
 | |
| 
 | |
|     expandedSize = strlen((const char *) name.name);
 | |
|     if (prefix.name != NULL)
 | |
|         expandedSize += strlen((const char *) prefix.name);
 | |
|     expandedSize += len;
 | |
| 
 | |
|     attr = &defaults->attrs[defaults->nbAttrs++];
 | |
|     attr->name = name;
 | |
|     attr->prefix = prefix;
 | |
|     attr->value = hvalue;
 | |
|     attr->valueEnd = hvalue.name + len;
 | |
|     attr->external = ctxt->external;
 | |
|     attr->expandedSize = expandedSize;
 | |
| 
 | |
|     return;
 | |
| 
 | |
| mem_error:
 | |
|     xmlErrMemory(ctxt, NULL);
 | |
|     return;
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlAddSpecialAttr:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @fullname:  the element fullname
 | |
|  * @fullattr:  the attribute fullname
 | |
|  * @type:  the attribute type
 | |
|  *
 | |
|  * Register this attribute type
 | |
|  */
 | |
| static void
 | |
| xmlAddSpecialAttr(xmlParserCtxtPtr ctxt,
 | |
| 		  const xmlChar *fullname,
 | |
| 		  const xmlChar *fullattr,
 | |
| 		  int type)
 | |
| {
 | |
|     if (ctxt->attsSpecial == NULL) {
 | |
|         ctxt->attsSpecial = xmlHashCreateDict(10, ctxt->dict);
 | |
| 	if (ctxt->attsSpecial == NULL)
 | |
| 	    goto mem_error;
 | |
|     }
 | |
| 
 | |
|     if (xmlHashLookup2(ctxt->attsSpecial, fullname, fullattr) != NULL)
 | |
|         return;
 | |
| 
 | |
|     xmlHashAddEntry2(ctxt->attsSpecial, fullname, fullattr,
 | |
|                      (void *) (ptrdiff_t) type);
 | |
|     return;
 | |
| 
 | |
| mem_error:
 | |
|     xmlErrMemory(ctxt, NULL);
 | |
|     return;
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlCleanSpecialAttrCallback:
 | |
|  *
 | |
|  * Removes CDATA attributes from the special attribute table
 | |
|  */
 | |
| static void
 | |
| xmlCleanSpecialAttrCallback(void *payload, void *data,
 | |
|                             const xmlChar *fullname, const xmlChar *fullattr,
 | |
|                             const xmlChar *unused ATTRIBUTE_UNUSED) {
 | |
|     xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) data;
 | |
| 
 | |
|     if (((ptrdiff_t) payload) == XML_ATTRIBUTE_CDATA) {
 | |
|         xmlHashRemoveEntry2(ctxt->attsSpecial, fullname, fullattr, NULL);
 | |
|     }
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlCleanSpecialAttr:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * Trim the list of attributes defined to remove all those of type
 | |
|  * CDATA as they are not special. This call should be done when finishing
 | |
|  * to parse the DTD and before starting to parse the document root.
 | |
|  */
 | |
| static void
 | |
| xmlCleanSpecialAttr(xmlParserCtxtPtr ctxt)
 | |
| {
 | |
|     if (ctxt->attsSpecial == NULL)
 | |
|         return;
 | |
| 
 | |
|     xmlHashScanFull(ctxt->attsSpecial, xmlCleanSpecialAttrCallback, ctxt);
 | |
| 
 | |
|     if (xmlHashSize(ctxt->attsSpecial) == 0) {
 | |
|         xmlHashFree(ctxt->attsSpecial, NULL);
 | |
|         ctxt->attsSpecial = NULL;
 | |
|     }
 | |
|     return;
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlCheckLanguageID:
 | |
|  * @lang:  pointer to the string value
 | |
|  *
 | |
|  * DEPRECATED: Internal function, do not use.
 | |
|  *
 | |
|  * Checks that the value conforms to the LanguageID production:
 | |
|  *
 | |
|  * NOTE: this is somewhat deprecated, those productions were removed from
 | |
|  *       the XML Second edition.
 | |
|  *
 | |
|  * [33] LanguageID ::= Langcode ('-' Subcode)*
 | |
|  * [34] Langcode ::= ISO639Code |  IanaCode |  UserCode
 | |
|  * [35] ISO639Code ::= ([a-z] | [A-Z]) ([a-z] | [A-Z])
 | |
|  * [36] IanaCode ::= ('i' | 'I') '-' ([a-z] | [A-Z])+
 | |
|  * [37] UserCode ::= ('x' | 'X') '-' ([a-z] | [A-Z])+
 | |
|  * [38] Subcode ::= ([a-z] | [A-Z])+
 | |
|  *
 | |
|  * The current REC reference the successors of RFC 1766, currently 5646
 | |
|  *
 | |
|  * http://www.rfc-editor.org/rfc/rfc5646.txt
 | |
|  * langtag       = language
 | |
|  *                 ["-" script]
 | |
|  *                 ["-" region]
 | |
|  *                 *("-" variant)
 | |
|  *                 *("-" extension)
 | |
|  *                 ["-" privateuse]
 | |
|  * language      = 2*3ALPHA            ; shortest ISO 639 code
 | |
|  *                 ["-" extlang]       ; sometimes followed by
 | |
|  *                                     ; extended language subtags
 | |
|  *               / 4ALPHA              ; or reserved for future use
 | |
|  *               / 5*8ALPHA            ; or registered language subtag
 | |
|  *
 | |
|  * extlang       = 3ALPHA              ; selected ISO 639 codes
 | |
|  *                 *2("-" 3ALPHA)      ; permanently reserved
 | |
|  *
 | |
|  * script        = 4ALPHA              ; ISO 15924 code
 | |
|  *
 | |
|  * region        = 2ALPHA              ; ISO 3166-1 code
 | |
|  *               / 3DIGIT              ; UN M.49 code
 | |
|  *
 | |
|  * variant       = 5*8alphanum         ; registered variants
 | |
|  *               / (DIGIT 3alphanum)
 | |
|  *
 | |
|  * extension     = singleton 1*("-" (2*8alphanum))
 | |
|  *
 | |
|  *                                     ; Single alphanumerics
 | |
|  *                                     ; "x" reserved for private use
 | |
|  * singleton     = DIGIT               ; 0 - 9
 | |
|  *               / %x41-57             ; A - W
 | |
|  *               / %x59-5A             ; Y - Z
 | |
|  *               / %x61-77             ; a - w
 | |
|  *               / %x79-7A             ; y - z
 | |
|  *
 | |
|  * it sounds right to still allow Irregular i-xxx IANA and user codes too
 | |
|  * The parser below doesn't try to cope with extension or privateuse
 | |
|  * that could be added but that's not interoperable anyway
 | |
|  *
 | |
|  * Returns 1 if correct 0 otherwise
 | |
|  **/
 | |
| int
 | |
| xmlCheckLanguageID(const xmlChar * lang)
 | |
| {
 | |
|     const xmlChar *cur = lang, *nxt;
 | |
| 
 | |
|     if (cur == NULL)
 | |
|         return (0);
 | |
|     if (((cur[0] == 'i') && (cur[1] == '-')) ||
 | |
|         ((cur[0] == 'I') && (cur[1] == '-')) ||
 | |
|         ((cur[0] == 'x') && (cur[1] == '-')) ||
 | |
|         ((cur[0] == 'X') && (cur[1] == '-'))) {
 | |
|         /*
 | |
|          * Still allow IANA code and user code which were coming
 | |
|          * from the previous version of the XML-1.0 specification
 | |
|          * it's deprecated but we should not fail
 | |
|          */
 | |
|         cur += 2;
 | |
|         while (((cur[0] >= 'A') && (cur[0] <= 'Z')) ||
 | |
|                ((cur[0] >= 'a') && (cur[0] <= 'z')))
 | |
|             cur++;
 | |
|         return(cur[0] == 0);
 | |
|     }
 | |
|     nxt = cur;
 | |
|     while (((nxt[0] >= 'A') && (nxt[0] <= 'Z')) ||
 | |
|            ((nxt[0] >= 'a') && (nxt[0] <= 'z')))
 | |
|            nxt++;
 | |
|     if (nxt - cur >= 4) {
 | |
|         /*
 | |
|          * Reserved
 | |
|          */
 | |
|         if ((nxt - cur > 8) || (nxt[0] != 0))
 | |
|             return(0);
 | |
|         return(1);
 | |
|     }
 | |
|     if (nxt - cur < 2)
 | |
|         return(0);
 | |
|     /* we got an ISO 639 code */
 | |
|     if (nxt[0] == 0)
 | |
|         return(1);
 | |
|     if (nxt[0] != '-')
 | |
|         return(0);
 | |
| 
 | |
|     nxt++;
 | |
|     cur = nxt;
 | |
|     /* now we can have extlang or script or region or variant */
 | |
|     if ((nxt[0] >= '0') && (nxt[0] <= '9'))
 | |
|         goto region_m49;
 | |
| 
 | |
|     while (((nxt[0] >= 'A') && (nxt[0] <= 'Z')) ||
 | |
|            ((nxt[0] >= 'a') && (nxt[0] <= 'z')))
 | |
|            nxt++;
 | |
|     if (nxt - cur == 4)
 | |
|         goto script;
 | |
|     if (nxt - cur == 2)
 | |
|         goto region;
 | |
|     if ((nxt - cur >= 5) && (nxt - cur <= 8))
 | |
|         goto variant;
 | |
|     if (nxt - cur != 3)
 | |
|         return(0);
 | |
|     /* we parsed an extlang */
 | |
|     if (nxt[0] == 0)
 | |
|         return(1);
 | |
|     if (nxt[0] != '-')
 | |
|         return(0);
 | |
| 
 | |
|     nxt++;
 | |
|     cur = nxt;
 | |
|     /* now we can have script or region or variant */
 | |
|     if ((nxt[0] >= '0') && (nxt[0] <= '9'))
 | |
|         goto region_m49;
 | |
| 
 | |
|     while (((nxt[0] >= 'A') && (nxt[0] <= 'Z')) ||
 | |
|            ((nxt[0] >= 'a') && (nxt[0] <= 'z')))
 | |
|            nxt++;
 | |
|     if (nxt - cur == 2)
 | |
|         goto region;
 | |
|     if ((nxt - cur >= 5) && (nxt - cur <= 8))
 | |
|         goto variant;
 | |
|     if (nxt - cur != 4)
 | |
|         return(0);
 | |
|     /* we parsed a script */
 | |
| script:
 | |
|     if (nxt[0] == 0)
 | |
|         return(1);
 | |
|     if (nxt[0] != '-')
 | |
|         return(0);
 | |
| 
 | |
|     nxt++;
 | |
|     cur = nxt;
 | |
|     /* now we can have region or variant */
 | |
|     if ((nxt[0] >= '0') && (nxt[0] <= '9'))
 | |
|         goto region_m49;
 | |
| 
 | |
|     while (((nxt[0] >= 'A') && (nxt[0] <= 'Z')) ||
 | |
|            ((nxt[0] >= 'a') && (nxt[0] <= 'z')))
 | |
|            nxt++;
 | |
| 
 | |
|     if ((nxt - cur >= 5) && (nxt - cur <= 8))
 | |
|         goto variant;
 | |
|     if (nxt - cur != 2)
 | |
|         return(0);
 | |
|     /* we parsed a region */
 | |
| region:
 | |
|     if (nxt[0] == 0)
 | |
|         return(1);
 | |
|     if (nxt[0] != '-')
 | |
|         return(0);
 | |
| 
 | |
|     nxt++;
 | |
|     cur = nxt;
 | |
|     /* now we can just have a variant */
 | |
|     while (((nxt[0] >= 'A') && (nxt[0] <= 'Z')) ||
 | |
|            ((nxt[0] >= 'a') && (nxt[0] <= 'z')))
 | |
|            nxt++;
 | |
| 
 | |
|     if ((nxt - cur < 5) || (nxt - cur > 8))
 | |
|         return(0);
 | |
| 
 | |
|     /* we parsed a variant */
 | |
| variant:
 | |
|     if (nxt[0] == 0)
 | |
|         return(1);
 | |
|     if (nxt[0] != '-')
 | |
|         return(0);
 | |
|     /* extensions and private use subtags not checked */
 | |
|     return (1);
 | |
| 
 | |
| region_m49:
 | |
|     if (((nxt[1] >= '0') && (nxt[1] <= '9')) &&
 | |
|         ((nxt[2] >= '0') && (nxt[2] <= '9'))) {
 | |
|         nxt += 3;
 | |
|         goto region;
 | |
|     }
 | |
|     return(0);
 | |
| }
 | |
| 
 | |
| /************************************************************************
 | |
|  *									*
 | |
|  *		Parser stacks related functions and macros		*
 | |
|  *									*
 | |
|  ************************************************************************/
 | |
| 
 | |
| static xmlEntityPtr xmlParseStringEntityRef(xmlParserCtxtPtr ctxt,
 | |
|                                             const xmlChar ** str);
 | |
| 
 | |
| /**
 | |
|  * xmlParserNsCreate:
 | |
|  *
 | |
|  * Create a new namespace database.
 | |
|  *
 | |
|  * Returns the new obejct.
 | |
|  */
 | |
| xmlParserNsData *
 | |
| xmlParserNsCreate(void) {
 | |
|     xmlParserNsData *nsdb = xmlMalloc(sizeof(*nsdb));
 | |
| 
 | |
|     if (nsdb == NULL)
 | |
|         return(NULL);
 | |
|     memset(nsdb, 0, sizeof(*nsdb));
 | |
|     nsdb->defaultNsIndex = INT_MAX;
 | |
| 
 | |
|     return(nsdb);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParserNsFree:
 | |
|  * @nsdb: namespace database
 | |
|  *
 | |
|  * Free a namespace database.
 | |
|  */
 | |
| void
 | |
| xmlParserNsFree(xmlParserNsData *nsdb) {
 | |
|     if (nsdb == NULL)
 | |
|         return;
 | |
| 
 | |
|     xmlFree(nsdb->extra);
 | |
|     xmlFree(nsdb->hash);
 | |
|     xmlFree(nsdb);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParserNsReset:
 | |
|  * @nsdb: namespace database
 | |
|  *
 | |
|  * Reset a namespace database.
 | |
|  */
 | |
| static void
 | |
| xmlParserNsReset(xmlParserNsData *nsdb) {
 | |
|     if (nsdb == NULL)
 | |
|         return;
 | |
| 
 | |
|     nsdb->hashElems = 0;
 | |
|     nsdb->elementId = 0;
 | |
|     nsdb->defaultNsIndex = INT_MAX;
 | |
| 
 | |
|     if (nsdb->hash)
 | |
|         memset(nsdb->hash, 0, nsdb->hashSize * sizeof(nsdb->hash[0]));
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParserStartElement:
 | |
|  * @nsdb: namespace database
 | |
|  *
 | |
|  * Signal that a new element has started.
 | |
|  *
 | |
|  * Returns 0 on success, -1 if the element counter overflowed.
 | |
|  */
 | |
| static int
 | |
| xmlParserNsStartElement(xmlParserNsData *nsdb) {
 | |
|     if (nsdb->elementId == UINT_MAX)
 | |
|         return(-1);
 | |
|     nsdb->elementId++;
 | |
| 
 | |
|     return(0);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParserNsLookup:
 | |
|  * @ctxt: parser context
 | |
|  * @prefix: namespace prefix
 | |
|  * @bucketPtr: optional bucket (return value)
 | |
|  *
 | |
|  * Lookup namespace with given prefix. If @bucketPtr is non-NULL, it will
 | |
|  * be set to the matching bucket, or the first empty bucket if no match
 | |
|  * was found.
 | |
|  *
 | |
|  * Returns the namespace index on success, INT_MAX if no namespace was
 | |
|  * found.
 | |
|  */
 | |
| static int
 | |
| xmlParserNsLookup(xmlParserCtxtPtr ctxt, const xmlHashedString *prefix,
 | |
|                   xmlParserNsBucket **bucketPtr) {
 | |
|     xmlParserNsBucket *bucket;
 | |
|     unsigned index, hashValue;
 | |
| 
 | |
|     if (prefix->name == NULL)
 | |
|         return(ctxt->nsdb->defaultNsIndex);
 | |
| 
 | |
|     if (ctxt->nsdb->hashSize == 0)
 | |
|         return(INT_MAX);
 | |
| 
 | |
|     hashValue = prefix->hashValue;
 | |
|     index = hashValue & (ctxt->nsdb->hashSize - 1);
 | |
|     bucket = &ctxt->nsdb->hash[index];
 | |
| 
 | |
|     while (bucket->hashValue) {
 | |
|         if ((bucket->hashValue == hashValue) &&
 | |
|             (bucket->index != INT_MAX)) {
 | |
|             if (ctxt->nsTab[bucket->index * 2] == prefix->name) {
 | |
|                 if (bucketPtr != NULL)
 | |
|                     *bucketPtr = bucket;
 | |
|                 return(bucket->index);
 | |
|             }
 | |
|         }
 | |
| 
 | |
|         index++;
 | |
|         bucket++;
 | |
|         if (index == ctxt->nsdb->hashSize) {
 | |
|             index = 0;
 | |
|             bucket = ctxt->nsdb->hash;
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     if (bucketPtr != NULL)
 | |
|         *bucketPtr = bucket;
 | |
|     return(INT_MAX);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParserNsLookupUri:
 | |
|  * @ctxt: parser context
 | |
|  * @prefix: namespace prefix
 | |
|  *
 | |
|  * Lookup namespace URI with given prefix.
 | |
|  *
 | |
|  * Returns the namespace URI on success, NULL if no namespace was found.
 | |
|  */
 | |
| static const xmlChar *
 | |
| xmlParserNsLookupUri(xmlParserCtxtPtr ctxt, const xmlHashedString *prefix) {
 | |
|     const xmlChar *ret;
 | |
|     int nsIndex;
 | |
| 
 | |
|     if (prefix->name == ctxt->str_xml)
 | |
|         return(ctxt->str_xml_ns);
 | |
| 
 | |
|     nsIndex = xmlParserNsLookup(ctxt, prefix, NULL);
 | |
|     if (nsIndex == INT_MAX)
 | |
|         return(NULL);
 | |
| 
 | |
|     ret = ctxt->nsTab[nsIndex * 2 + 1];
 | |
|     if (ret[0] == 0)
 | |
|         ret = NULL;
 | |
|     return(ret);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParserNsLookupSax:
 | |
|  * @ctxt: parser context
 | |
|  * @prefix: namespace prefix
 | |
|  *
 | |
|  * Lookup extra data for the given prefix. This returns data stored
 | |
|  * with xmlParserNsUdpateSax.
 | |
|  *
 | |
|  * Returns the data on success, NULL if no namespace was found.
 | |
|  */
 | |
| void *
 | |
| xmlParserNsLookupSax(xmlParserCtxtPtr ctxt, const xmlChar *prefix) {
 | |
|     xmlHashedString hprefix;
 | |
|     int nsIndex;
 | |
| 
 | |
|     if (prefix == ctxt->str_xml)
 | |
|         return(NULL);
 | |
| 
 | |
|     hprefix.name = prefix;
 | |
|     if (prefix != NULL)
 | |
|         hprefix.hashValue = xmlDictComputeHash(ctxt->dict, prefix);
 | |
|     else
 | |
|         hprefix.hashValue = 0;
 | |
|     nsIndex = xmlParserNsLookup(ctxt, &hprefix, NULL);
 | |
|     if (nsIndex == INT_MAX)
 | |
|         return(NULL);
 | |
| 
 | |
|     return(ctxt->nsdb->extra[nsIndex].saxData);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParserNsUpdateSax:
 | |
|  * @ctxt: parser context
 | |
|  * @prefix: namespace prefix
 | |
|  * @saxData: extra data for SAX handler
 | |
|  *
 | |
|  * Sets or updates extra data for the given prefix. This value will be
 | |
|  * returned by xmlParserNsLookupSax as long as the namespace with the
 | |
|  * given prefix is in scope.
 | |
|  *
 | |
|  * Returns the data on success, NULL if no namespace was found.
 | |
|  */
 | |
| int
 | |
| xmlParserNsUpdateSax(xmlParserCtxtPtr ctxt, const xmlChar *prefix,
 | |
|                      void *saxData) {
 | |
|     xmlHashedString hprefix;
 | |
|     int nsIndex;
 | |
| 
 | |
|     if (prefix == ctxt->str_xml)
 | |
|         return(-1);
 | |
| 
 | |
|     hprefix.name = prefix;
 | |
|     if (prefix != NULL)
 | |
|         hprefix.hashValue = xmlDictComputeHash(ctxt->dict, prefix);
 | |
|     else
 | |
|         hprefix.hashValue = 0;
 | |
|     nsIndex = xmlParserNsLookup(ctxt, &hprefix, NULL);
 | |
|     if (nsIndex == INT_MAX)
 | |
|         return(-1);
 | |
| 
 | |
|     ctxt->nsdb->extra[nsIndex].saxData = saxData;
 | |
|     return(0);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParserNsGrow:
 | |
|  * @ctxt: parser context
 | |
|  *
 | |
|  * Grows the namespace tables.
 | |
|  *
 | |
|  * Returns 0 on success, -1 if a memory allocation failed.
 | |
|  */
 | |
| static int
 | |
| xmlParserNsGrow(xmlParserCtxtPtr ctxt) {
 | |
|     const xmlChar **table;
 | |
|     xmlParserNsExtra *extra;
 | |
|     int newSize;
 | |
| 
 | |
|     if (ctxt->nsMax > INT_MAX / 2)
 | |
|         goto error;
 | |
|     newSize = ctxt->nsMax ? ctxt->nsMax * 2 : 16;
 | |
| 
 | |
|     table = xmlRealloc(ctxt->nsTab, 2 * newSize * sizeof(table[0]));
 | |
|     if (table == NULL)
 | |
|         goto error;
 | |
|     ctxt->nsTab = table;
 | |
| 
 | |
|     extra = xmlRealloc(ctxt->nsdb->extra, newSize * sizeof(extra[0]));
 | |
|     if (extra == NULL)
 | |
|         goto error;
 | |
|     ctxt->nsdb->extra = extra;
 | |
| 
 | |
|     ctxt->nsMax = newSize;
 | |
|     return(0);
 | |
| 
 | |
| error:
 | |
|     xmlErrMemory(ctxt, NULL);
 | |
|     return(-1);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParserNsPush:
 | |
|  * @ctxt: parser context
 | |
|  * @prefix: prefix with hash value
 | |
|  * @uri: uri with hash value
 | |
|  * @saxData: extra data for SAX handler
 | |
|  * @defAttr: whether the namespace comes from a default attribute
 | |
|  *
 | |
|  * Push a new namespace on the table.
 | |
|  *
 | |
|  * Returns 1 if the namespace was pushed, 0 if the namespace was ignored,
 | |
|  * -1 if a memory allocation failed.
 | |
|  */
 | |
| static int
 | |
| xmlParserNsPush(xmlParserCtxtPtr ctxt, const xmlHashedString *prefix,
 | |
|                 const xmlHashedString *uri, void *saxData, int defAttr) {
 | |
|     xmlParserNsBucket *bucket = NULL;
 | |
|     xmlParserNsExtra *extra;
 | |
|     const xmlChar **ns;
 | |
|     unsigned hashValue, nsIndex, oldIndex;
 | |
| 
 | |
|     if ((prefix != NULL) && (prefix->name == ctxt->str_xml))
 | |
|         return(0);
 | |
| 
 | |
|     if ((ctxt->nsNr >= ctxt->nsMax) && (xmlParserNsGrow(ctxt) < 0)) {
 | |
|         xmlErrMemory(ctxt, NULL);
 | |
|         return(-1);
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * Default namespace and 'xml' namespace
 | |
|      */
 | |
|     if ((prefix == NULL) || (prefix->name == NULL)) {
 | |
|         oldIndex = ctxt->nsdb->defaultNsIndex;
 | |
| 
 | |
|         if (oldIndex != INT_MAX) {
 | |
|             if (defAttr != 0)
 | |
|                 return(0);
 | |
| 
 | |
|             extra = &ctxt->nsdb->extra[oldIndex];
 | |
| 
 | |
|             if (extra->elementId == ctxt->nsdb->elementId) {
 | |
|                 xmlErrAttributeDup(ctxt, NULL, BAD_CAST "xmlns");
 | |
|                 return(0);
 | |
|             }
 | |
| 
 | |
|             if ((ctxt->options & XML_PARSE_NSCLEAN) &&
 | |
|                 (uri->name == ctxt->nsTab[oldIndex * 2 + 1]))
 | |
|                 return(0);
 | |
|         }
 | |
| 
 | |
|         ctxt->nsdb->defaultNsIndex = ctxt->nsNr;
 | |
|         goto populate_entry;
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * Hash table lookup
 | |
|      */
 | |
|     oldIndex = xmlParserNsLookup(ctxt, prefix, &bucket);
 | |
|     if (oldIndex != INT_MAX) {
 | |
|         extra = &ctxt->nsdb->extra[oldIndex];
 | |
| 
 | |
|         if (defAttr != 0)
 | |
|             return(0);
 | |
| 
 | |
|         /*
 | |
|          * Check for duplicate definitions on the same element.
 | |
|          */
 | |
|         if (extra->elementId == ctxt->nsdb->elementId) {
 | |
|             xmlErrAttributeDup(ctxt, BAD_CAST "xmlns", prefix->name);
 | |
|             return(0);
 | |
|         }
 | |
| 
 | |
|         if ((ctxt->options & XML_PARSE_NSCLEAN) &&
 | |
|             (uri->name == ctxt->nsTab[bucket->index * 2 + 1]))
 | |
|             return(0);
 | |
| 
 | |
|         bucket->index = ctxt->nsNr;
 | |
|         goto populate_entry;
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * Insert new bucket
 | |
|      */
 | |
| 
 | |
|     hashValue = prefix->hashValue;
 | |
| 
 | |
|     /*
 | |
|      * Grow hash table, 50% fill factor
 | |
|      */
 | |
|     if (ctxt->nsdb->hashElems + 1 > ctxt->nsdb->hashSize / 2) {
 | |
|         xmlParserNsBucket *newHash;
 | |
|         unsigned newSize, i, index;
 | |
| 
 | |
|         if (ctxt->nsdb->hashSize > UINT_MAX / 2) {
 | |
|             xmlErrMemory(ctxt, NULL);
 | |
|             return(-1);
 | |
|         }
 | |
|         newSize = ctxt->nsdb->hashSize ? ctxt->nsdb->hashSize * 2 : 16;
 | |
|         newHash = xmlMalloc(newSize * sizeof(newHash[0]));
 | |
|         if (newHash == NULL) {
 | |
|             xmlErrMemory(ctxt, NULL);
 | |
|             return(-1);
 | |
|         }
 | |
|         memset(newHash, 0, newSize * sizeof(newHash[0]));
 | |
| 
 | |
|         for (i = 0; i < ctxt->nsdb->hashSize; i++) {
 | |
|             unsigned hv = ctxt->nsdb->hash[i].hashValue;
 | |
|             unsigned newIndex;
 | |
| 
 | |
|             if (hv == 0)
 | |
|                 continue;
 | |
|             newIndex = hv & (newSize - 1);
 | |
| 
 | |
|             while (newHash[newIndex].hashValue != 0) {
 | |
|                 newIndex++;
 | |
|                 if (newIndex == newSize)
 | |
|                     newIndex = 0;
 | |
|             }
 | |
| 
 | |
|             newHash[newIndex] = ctxt->nsdb->hash[i];
 | |
|         }
 | |
| 
 | |
|         xmlFree(ctxt->nsdb->hash);
 | |
|         ctxt->nsdb->hash = newHash;
 | |
|         ctxt->nsdb->hashSize = newSize;
 | |
| 
 | |
|         /*
 | |
|          * Relookup
 | |
|          */
 | |
|         index = hashValue & (newSize - 1);
 | |
| 
 | |
|         while (newHash[index].hashValue != 0) {
 | |
|             index++;
 | |
|             if (index == newSize)
 | |
|                 index = 0;
 | |
|         }
 | |
| 
 | |
|         bucket = &newHash[index];
 | |
|     }
 | |
| 
 | |
|     bucket->hashValue = hashValue;
 | |
|     bucket->index = ctxt->nsNr;
 | |
|     ctxt->nsdb->hashElems++;
 | |
|     oldIndex = INT_MAX;
 | |
| 
 | |
| populate_entry:
 | |
|     nsIndex = ctxt->nsNr;
 | |
| 
 | |
|     ns = &ctxt->nsTab[nsIndex * 2];
 | |
|     ns[0] = prefix ? prefix->name : NULL;
 | |
|     ns[1] = uri->name;
 | |
| 
 | |
|     extra = &ctxt->nsdb->extra[nsIndex];
 | |
|     extra->saxData = saxData;
 | |
|     extra->prefixHashValue = prefix ? prefix->hashValue : 0;
 | |
|     extra->uriHashValue = uri->hashValue;
 | |
|     extra->elementId = ctxt->nsdb->elementId;
 | |
|     extra->oldIndex = oldIndex;
 | |
| 
 | |
|     ctxt->nsNr++;
 | |
| 
 | |
|     return(1);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParserNsPop:
 | |
|  * @ctxt: an XML parser context
 | |
|  * @nr:  the number to pop
 | |
|  *
 | |
|  * Pops the top @nr namespaces and restores the hash table.
 | |
|  *
 | |
|  * Returns the number of namespaces popped.
 | |
|  */
 | |
| static int
 | |
| xmlParserNsPop(xmlParserCtxtPtr ctxt, int nr)
 | |
| {
 | |
|     int i;
 | |
| 
 | |
|     /* assert(nr <= ctxt->nsNr); */
 | |
| 
 | |
|     for (i = ctxt->nsNr - 1; i >= ctxt->nsNr - nr; i--) {
 | |
|         const xmlChar *prefix = ctxt->nsTab[i * 2];
 | |
|         xmlParserNsExtra *extra = &ctxt->nsdb->extra[i];
 | |
| 
 | |
|         if (prefix == NULL) {
 | |
|             ctxt->nsdb->defaultNsIndex = extra->oldIndex;
 | |
|         } else {
 | |
|             xmlHashedString hprefix;
 | |
|             xmlParserNsBucket *bucket = NULL;
 | |
| 
 | |
|             hprefix.name = prefix;
 | |
|             hprefix.hashValue = extra->prefixHashValue;
 | |
|             xmlParserNsLookup(ctxt, &hprefix, &bucket);
 | |
|             /* assert(bucket && bucket->hashValue); */
 | |
|             bucket->index = extra->oldIndex;
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     ctxt->nsNr -= nr;
 | |
|     return(nr);
 | |
| }
 | |
| 
 | |
| static int
 | |
| xmlCtxtGrowAttrs(xmlParserCtxtPtr ctxt, int nr) {
 | |
|     const xmlChar **atts;
 | |
|     unsigned *attallocs;
 | |
|     int maxatts;
 | |
| 
 | |
|     if (nr + 5 > ctxt->maxatts) {
 | |
| 	maxatts = ctxt->maxatts == 0 ? 55 : (nr + 5) * 2;
 | |
| 	atts = (const xmlChar **) xmlMalloc(
 | |
| 				     maxatts * sizeof(const xmlChar *));
 | |
| 	if (atts == NULL) goto mem_error;
 | |
| 	attallocs = xmlRealloc(ctxt->attallocs,
 | |
|                                (maxatts / 5) * sizeof(attallocs[0]));
 | |
| 	if (attallocs == NULL) {
 | |
|             xmlFree(atts);
 | |
|             goto mem_error;
 | |
|         }
 | |
|         if (ctxt->maxatts > 0)
 | |
|             memcpy(atts, ctxt->atts, ctxt->maxatts * sizeof(const xmlChar *));
 | |
|         xmlFree(ctxt->atts);
 | |
| 	ctxt->atts = atts;
 | |
| 	ctxt->attallocs = attallocs;
 | |
| 	ctxt->maxatts = maxatts;
 | |
|     }
 | |
|     return(ctxt->maxatts);
 | |
| mem_error:
 | |
|     xmlErrMemory(ctxt, NULL);
 | |
|     return(-1);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * inputPush:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @value:  the parser input
 | |
|  *
 | |
|  * Pushes a new parser input on top of the input stack
 | |
|  *
 | |
|  * Returns -1 in case of error, the index in the stack otherwise
 | |
|  */
 | |
| int
 | |
| inputPush(xmlParserCtxtPtr ctxt, xmlParserInputPtr value)
 | |
| {
 | |
|     if ((ctxt == NULL) || (value == NULL))
 | |
|         return(-1);
 | |
|     if (ctxt->inputNr >= ctxt->inputMax) {
 | |
|         size_t newSize = ctxt->inputMax * 2;
 | |
|         xmlParserInputPtr *tmp;
 | |
| 
 | |
|         tmp = (xmlParserInputPtr *) xmlRealloc(ctxt->inputTab,
 | |
|                                                newSize * sizeof(*tmp));
 | |
|         if (tmp == NULL) {
 | |
|             xmlErrMemory(ctxt, NULL);
 | |
|             return (-1);
 | |
|         }
 | |
|         ctxt->inputTab = tmp;
 | |
|         ctxt->inputMax = newSize;
 | |
|     }
 | |
|     ctxt->inputTab[ctxt->inputNr] = value;
 | |
|     ctxt->input = value;
 | |
|     return (ctxt->inputNr++);
 | |
| }
 | |
| /**
 | |
|  * inputPop:
 | |
|  * @ctxt: an XML parser context
 | |
|  *
 | |
|  * Pops the top parser input from the input stack
 | |
|  *
 | |
|  * Returns the input just removed
 | |
|  */
 | |
| xmlParserInputPtr
 | |
| inputPop(xmlParserCtxtPtr ctxt)
 | |
| {
 | |
|     xmlParserInputPtr ret;
 | |
| 
 | |
|     if (ctxt == NULL)
 | |
|         return(NULL);
 | |
|     if (ctxt->inputNr <= 0)
 | |
|         return (NULL);
 | |
|     ctxt->inputNr--;
 | |
|     if (ctxt->inputNr > 0)
 | |
|         ctxt->input = ctxt->inputTab[ctxt->inputNr - 1];
 | |
|     else
 | |
|         ctxt->input = NULL;
 | |
|     ret = ctxt->inputTab[ctxt->inputNr];
 | |
|     ctxt->inputTab[ctxt->inputNr] = NULL;
 | |
|     return (ret);
 | |
| }
 | |
| /**
 | |
|  * nodePush:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @value:  the element node
 | |
|  *
 | |
|  * DEPRECATED: Internal function, do not use.
 | |
|  *
 | |
|  * Pushes a new element node on top of the node stack
 | |
|  *
 | |
|  * Returns -1 in case of error, the index in the stack otherwise
 | |
|  */
 | |
| int
 | |
| nodePush(xmlParserCtxtPtr ctxt, xmlNodePtr value)
 | |
| {
 | |
|     if (ctxt == NULL) return(0);
 | |
|     if (ctxt->nodeNr >= ctxt->nodeMax) {
 | |
|         xmlNodePtr *tmp;
 | |
| 
 | |
| 	tmp = (xmlNodePtr *) xmlRealloc(ctxt->nodeTab,
 | |
|                                       ctxt->nodeMax * 2 *
 | |
|                                       sizeof(ctxt->nodeTab[0]));
 | |
|         if (tmp == NULL) {
 | |
|             xmlErrMemory(ctxt, NULL);
 | |
|             return (-1);
 | |
|         }
 | |
|         ctxt->nodeTab = tmp;
 | |
| 	ctxt->nodeMax *= 2;
 | |
|     }
 | |
|     if ((((unsigned int) ctxt->nodeNr) > xmlParserMaxDepth) &&
 | |
|         ((ctxt->options & XML_PARSE_HUGE) == 0)) {
 | |
| 	xmlFatalErrMsgInt(ctxt, XML_ERR_INTERNAL_ERROR,
 | |
| 		 "Excessive depth in document: %d use XML_PARSE_HUGE option\n",
 | |
| 			  xmlParserMaxDepth);
 | |
| 	xmlHaltParser(ctxt);
 | |
| 	return(-1);
 | |
|     }
 | |
|     ctxt->nodeTab[ctxt->nodeNr] = value;
 | |
|     ctxt->node = value;
 | |
|     return (ctxt->nodeNr++);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * nodePop:
 | |
|  * @ctxt: an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, do not use.
 | |
|  *
 | |
|  * Pops the top element node from the node stack
 | |
|  *
 | |
|  * Returns the node just removed
 | |
|  */
 | |
| xmlNodePtr
 | |
| nodePop(xmlParserCtxtPtr ctxt)
 | |
| {
 | |
|     xmlNodePtr ret;
 | |
| 
 | |
|     if (ctxt == NULL) return(NULL);
 | |
|     if (ctxt->nodeNr <= 0)
 | |
|         return (NULL);
 | |
|     ctxt->nodeNr--;
 | |
|     if (ctxt->nodeNr > 0)
 | |
|         ctxt->node = ctxt->nodeTab[ctxt->nodeNr - 1];
 | |
|     else
 | |
|         ctxt->node = NULL;
 | |
|     ret = ctxt->nodeTab[ctxt->nodeNr];
 | |
|     ctxt->nodeTab[ctxt->nodeNr] = NULL;
 | |
|     return (ret);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * nameNsPush:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @value:  the element name
 | |
|  * @prefix:  the element prefix
 | |
|  * @URI:  the element namespace name
 | |
|  * @line:  the current line number for error messages
 | |
|  * @nsNr:  the number of namespaces pushed on the namespace table
 | |
|  *
 | |
|  * Pushes a new element name/prefix/URL on top of the name stack
 | |
|  *
 | |
|  * Returns -1 in case of error, the index in the stack otherwise
 | |
|  */
 | |
| static int
 | |
| nameNsPush(xmlParserCtxtPtr ctxt, const xmlChar * value,
 | |
|            const xmlChar *prefix, const xmlChar *URI, int line, int nsNr)
 | |
| {
 | |
|     xmlStartTag *tag;
 | |
| 
 | |
|     if (ctxt->nameNr >= ctxt->nameMax) {
 | |
|         const xmlChar * *tmp;
 | |
|         xmlStartTag *tmp2;
 | |
|         ctxt->nameMax *= 2;
 | |
|         tmp = (const xmlChar * *) xmlRealloc((xmlChar * *)ctxt->nameTab,
 | |
|                                     ctxt->nameMax *
 | |
|                                     sizeof(ctxt->nameTab[0]));
 | |
|         if (tmp == NULL) {
 | |
| 	    ctxt->nameMax /= 2;
 | |
| 	    goto mem_error;
 | |
|         }
 | |
| 	ctxt->nameTab = tmp;
 | |
|         tmp2 = (xmlStartTag *) xmlRealloc((void * *)ctxt->pushTab,
 | |
|                                     ctxt->nameMax *
 | |
|                                     sizeof(ctxt->pushTab[0]));
 | |
|         if (tmp2 == NULL) {
 | |
| 	    ctxt->nameMax /= 2;
 | |
| 	    goto mem_error;
 | |
|         }
 | |
| 	ctxt->pushTab = tmp2;
 | |
|     } else if (ctxt->pushTab == NULL) {
 | |
|         ctxt->pushTab = (xmlStartTag *) xmlMalloc(ctxt->nameMax *
 | |
|                                             sizeof(ctxt->pushTab[0]));
 | |
|         if (ctxt->pushTab == NULL)
 | |
|             goto mem_error;
 | |
|     }
 | |
|     ctxt->nameTab[ctxt->nameNr] = value;
 | |
|     ctxt->name = value;
 | |
|     tag = &ctxt->pushTab[ctxt->nameNr];
 | |
|     tag->prefix = prefix;
 | |
|     tag->URI = URI;
 | |
|     tag->line = line;
 | |
|     tag->nsNr = nsNr;
 | |
|     return (ctxt->nameNr++);
 | |
| mem_error:
 | |
|     xmlErrMemory(ctxt, NULL);
 | |
|     return (-1);
 | |
| }
 | |
| #ifdef LIBXML_PUSH_ENABLED
 | |
| /**
 | |
|  * nameNsPop:
 | |
|  * @ctxt: an XML parser context
 | |
|  *
 | |
|  * Pops the top element/prefix/URI name from the name stack
 | |
|  *
 | |
|  * Returns the name just removed
 | |
|  */
 | |
| static const xmlChar *
 | |
| nameNsPop(xmlParserCtxtPtr ctxt)
 | |
| {
 | |
|     const xmlChar *ret;
 | |
| 
 | |
|     if (ctxt->nameNr <= 0)
 | |
|         return (NULL);
 | |
|     ctxt->nameNr--;
 | |
|     if (ctxt->nameNr > 0)
 | |
|         ctxt->name = ctxt->nameTab[ctxt->nameNr - 1];
 | |
|     else
 | |
|         ctxt->name = NULL;
 | |
|     ret = ctxt->nameTab[ctxt->nameNr];
 | |
|     ctxt->nameTab[ctxt->nameNr] = NULL;
 | |
|     return (ret);
 | |
| }
 | |
| #endif /* LIBXML_PUSH_ENABLED */
 | |
| 
 | |
| /**
 | |
|  * namePush:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @value:  the element name
 | |
|  *
 | |
|  * DEPRECATED: Internal function, do not use.
 | |
|  *
 | |
|  * Pushes a new element name on top of the name stack
 | |
|  *
 | |
|  * Returns -1 in case of error, the index in the stack otherwise
 | |
|  */
 | |
| int
 | |
| namePush(xmlParserCtxtPtr ctxt, const xmlChar * value)
 | |
| {
 | |
|     if (ctxt == NULL) return (-1);
 | |
| 
 | |
|     if (ctxt->nameNr >= ctxt->nameMax) {
 | |
|         const xmlChar * *tmp;
 | |
|         tmp = (const xmlChar * *) xmlRealloc((xmlChar * *)ctxt->nameTab,
 | |
|                                     ctxt->nameMax * 2 *
 | |
|                                     sizeof(ctxt->nameTab[0]));
 | |
|         if (tmp == NULL) {
 | |
| 	    goto mem_error;
 | |
|         }
 | |
| 	ctxt->nameTab = tmp;
 | |
|         ctxt->nameMax *= 2;
 | |
|     }
 | |
|     ctxt->nameTab[ctxt->nameNr] = value;
 | |
|     ctxt->name = value;
 | |
|     return (ctxt->nameNr++);
 | |
| mem_error:
 | |
|     xmlErrMemory(ctxt, NULL);
 | |
|     return (-1);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * namePop:
 | |
|  * @ctxt: an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, do not use.
 | |
|  *
 | |
|  * Pops the top element name from the name stack
 | |
|  *
 | |
|  * Returns the name just removed
 | |
|  */
 | |
| const xmlChar *
 | |
| namePop(xmlParserCtxtPtr ctxt)
 | |
| {
 | |
|     const xmlChar *ret;
 | |
| 
 | |
|     if ((ctxt == NULL) || (ctxt->nameNr <= 0))
 | |
|         return (NULL);
 | |
|     ctxt->nameNr--;
 | |
|     if (ctxt->nameNr > 0)
 | |
|         ctxt->name = ctxt->nameTab[ctxt->nameNr - 1];
 | |
|     else
 | |
|         ctxt->name = NULL;
 | |
|     ret = ctxt->nameTab[ctxt->nameNr];
 | |
|     ctxt->nameTab[ctxt->nameNr] = NULL;
 | |
|     return (ret);
 | |
| }
 | |
| 
 | |
| static int spacePush(xmlParserCtxtPtr ctxt, int val) {
 | |
|     if (ctxt->spaceNr >= ctxt->spaceMax) {
 | |
|         int *tmp;
 | |
| 
 | |
| 	ctxt->spaceMax *= 2;
 | |
|         tmp = (int *) xmlRealloc(ctxt->spaceTab,
 | |
| 	                         ctxt->spaceMax * sizeof(ctxt->spaceTab[0]));
 | |
|         if (tmp == NULL) {
 | |
| 	    xmlErrMemory(ctxt, NULL);
 | |
| 	    ctxt->spaceMax /=2;
 | |
| 	    return(-1);
 | |
| 	}
 | |
| 	ctxt->spaceTab = tmp;
 | |
|     }
 | |
|     ctxt->spaceTab[ctxt->spaceNr] = val;
 | |
|     ctxt->space = &ctxt->spaceTab[ctxt->spaceNr];
 | |
|     return(ctxt->spaceNr++);
 | |
| }
 | |
| 
 | |
| static int spacePop(xmlParserCtxtPtr ctxt) {
 | |
|     int ret;
 | |
|     if (ctxt->spaceNr <= 0) return(0);
 | |
|     ctxt->spaceNr--;
 | |
|     if (ctxt->spaceNr > 0)
 | |
| 	ctxt->space = &ctxt->spaceTab[ctxt->spaceNr - 1];
 | |
|     else
 | |
|         ctxt->space = &ctxt->spaceTab[0];
 | |
|     ret = ctxt->spaceTab[ctxt->spaceNr];
 | |
|     ctxt->spaceTab[ctxt->spaceNr] = -1;
 | |
|     return(ret);
 | |
| }
 | |
| 
 | |
| /*
 | |
|  * Macros for accessing the content. Those should be used only by the parser,
 | |
|  * and not exported.
 | |
|  *
 | |
|  * Dirty macros, i.e. one often need to make assumption on the context to
 | |
|  * use them
 | |
|  *
 | |
|  *   CUR_PTR return the current pointer to the xmlChar to be parsed.
 | |
|  *           To be used with extreme caution since operations consuming
 | |
|  *           characters may move the input buffer to a different location !
 | |
|  *   CUR     returns the current xmlChar value, i.e. a 8 bit value if compiled
 | |
|  *           This should be used internally by the parser
 | |
|  *           only to compare to ASCII values otherwise it would break when
 | |
|  *           running with UTF-8 encoding.
 | |
|  *   RAW     same as CUR but in the input buffer, bypass any token
 | |
|  *           extraction that may have been done
 | |
|  *   NXT(n)  returns the n'th next xmlChar. Same as CUR is should be used only
 | |
|  *           to compare on ASCII based substring.
 | |
|  *   SKIP(n) Skip n xmlChar, and must also be used only to skip ASCII defined
 | |
|  *           strings without newlines within the parser.
 | |
|  *   NEXT1(l) Skip 1 xmlChar, and must also be used only to skip 1 non-newline ASCII
 | |
|  *           defined char within the parser.
 | |
|  * Clean macros, not dependent of an ASCII context, expect UTF-8 encoding
 | |
|  *
 | |
|  *   NEXT    Skip to the next character, this does the proper decoding
 | |
|  *           in UTF-8 mode. It also pop-up unfinished entities on the fly.
 | |
|  *   NEXTL(l) Skip the current unicode character of l xmlChars long.
 | |
|  *   CUR_CHAR(l) returns the current unicode character (int), set l
 | |
|  *           to the number of xmlChars used for the encoding [0-5].
 | |
|  *   CUR_SCHAR  same but operate on a string instead of the context
 | |
|  *   COPY_BUF  copy the current unicode char to the target buffer, increment
 | |
|  *            the index
 | |
|  *   GROW, SHRINK  handling of input buffers
 | |
|  */
 | |
| 
 | |
| #define RAW (*ctxt->input->cur)
 | |
| #define CUR (*ctxt->input->cur)
 | |
| #define NXT(val) ctxt->input->cur[(val)]
 | |
| #define CUR_PTR ctxt->input->cur
 | |
| #define BASE_PTR ctxt->input->base
 | |
| 
 | |
| #define CMP4( s, c1, c2, c3, c4 ) \
 | |
|   ( ((unsigned char *) s)[ 0 ] == c1 && ((unsigned char *) s)[ 1 ] == c2 && \
 | |
|     ((unsigned char *) s)[ 2 ] == c3 && ((unsigned char *) s)[ 3 ] == c4 )
 | |
| #define CMP5( s, c1, c2, c3, c4, c5 ) \
 | |
|   ( CMP4( s, c1, c2, c3, c4 ) && ((unsigned char *) s)[ 4 ] == c5 )
 | |
| #define CMP6( s, c1, c2, c3, c4, c5, c6 ) \
 | |
|   ( CMP5( s, c1, c2, c3, c4, c5 ) && ((unsigned char *) s)[ 5 ] == c6 )
 | |
| #define CMP7( s, c1, c2, c3, c4, c5, c6, c7 ) \
 | |
|   ( CMP6( s, c1, c2, c3, c4, c5, c6 ) && ((unsigned char *) s)[ 6 ] == c7 )
 | |
| #define CMP8( s, c1, c2, c3, c4, c5, c6, c7, c8 ) \
 | |
|   ( CMP7( s, c1, c2, c3, c4, c5, c6, c7 ) && ((unsigned char *) s)[ 7 ] == c8 )
 | |
| #define CMP9( s, c1, c2, c3, c4, c5, c6, c7, c8, c9 ) \
 | |
|   ( CMP8( s, c1, c2, c3, c4, c5, c6, c7, c8 ) && \
 | |
|     ((unsigned char *) s)[ 8 ] == c9 )
 | |
| #define CMP10( s, c1, c2, c3, c4, c5, c6, c7, c8, c9, c10 ) \
 | |
|   ( CMP9( s, c1, c2, c3, c4, c5, c6, c7, c8, c9 ) && \
 | |
|     ((unsigned char *) s)[ 9 ] == c10 )
 | |
| 
 | |
| #define SKIP(val) do {							\
 | |
|     ctxt->input->cur += (val),ctxt->input->col+=(val);			\
 | |
|     if (*ctxt->input->cur == 0)						\
 | |
|         xmlParserGrow(ctxt);						\
 | |
|   } while (0)
 | |
| 
 | |
| #define SKIPL(val) do {							\
 | |
|     int skipl;								\
 | |
|     for(skipl=0; skipl<val; skipl++) {					\
 | |
| 	if (*(ctxt->input->cur) == '\n') {				\
 | |
| 	ctxt->input->line++; ctxt->input->col = 1;			\
 | |
| 	} else ctxt->input->col++;					\
 | |
| 	ctxt->input->cur++;						\
 | |
|     }									\
 | |
|     if (*ctxt->input->cur == 0)						\
 | |
|         xmlParserGrow(ctxt);						\
 | |
|   } while (0)
 | |
| 
 | |
| /* Don't shrink push parser buffer. */
 | |
| #define SHRINK \
 | |
|     if (((ctxt->progressive == 0) || (ctxt->inputNr > 1)) && \
 | |
|         (ctxt->input->cur - ctxt->input->base > 2 * INPUT_CHUNK) && \
 | |
| 	(ctxt->input->end - ctxt->input->cur < 2 * INPUT_CHUNK)) \
 | |
| 	xmlParserShrink(ctxt);
 | |
| 
 | |
| #define GROW if (ctxt->input->end - ctxt->input->cur < INPUT_CHUNK)	\
 | |
| 	xmlParserGrow(ctxt);
 | |
| 
 | |
| #define SKIP_BLANKS xmlSkipBlankChars(ctxt)
 | |
| 
 | |
| #define NEXT xmlNextChar(ctxt)
 | |
| 
 | |
| #define NEXT1 {								\
 | |
| 	ctxt->input->col++;						\
 | |
| 	ctxt->input->cur++;						\
 | |
| 	if (*ctxt->input->cur == 0)					\
 | |
| 	    xmlParserGrow(ctxt);						\
 | |
|     }
 | |
| 
 | |
| #define NEXTL(l) do {							\
 | |
|     if (*(ctxt->input->cur) == '\n') {					\
 | |
| 	ctxt->input->line++; ctxt->input->col = 1;			\
 | |
|     } else ctxt->input->col++;						\
 | |
|     ctxt->input->cur += l;				\
 | |
|   } while (0)
 | |
| 
 | |
| #define CUR_CHAR(l) xmlCurrentChar(ctxt, &l)
 | |
| #define CUR_SCHAR(s, l) xmlStringCurrentChar(ctxt, s, &l)
 | |
| 
 | |
| #define COPY_BUF(b, i, v)						\
 | |
|     if (v < 0x80) b[i++] = v;						\
 | |
|     else i += xmlCopyCharMultiByte(&b[i],v)
 | |
| 
 | |
| /**
 | |
|  * xmlSkipBlankChars:
 | |
|  * @ctxt:  the XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, do not use.
 | |
|  *
 | |
|  * skip all blanks character found at that point in the input streams.
 | |
|  * It pops up finished entities in the process if allowable at that point.
 | |
|  *
 | |
|  * Returns the number of space chars skipped
 | |
|  */
 | |
| 
 | |
| int
 | |
| xmlSkipBlankChars(xmlParserCtxtPtr ctxt) {
 | |
|     int res = 0;
 | |
| 
 | |
|     /*
 | |
|      * It's Okay to use CUR/NEXT here since all the blanks are on
 | |
|      * the ASCII range.
 | |
|      */
 | |
|     if (((ctxt->inputNr == 1) && (ctxt->instate != XML_PARSER_DTD)) ||
 | |
|         (ctxt->instate == XML_PARSER_START)) {
 | |
| 	const xmlChar *cur;
 | |
| 	/*
 | |
| 	 * if we are in the document content, go really fast
 | |
| 	 */
 | |
| 	cur = ctxt->input->cur;
 | |
| 	while (IS_BLANK_CH(*cur)) {
 | |
| 	    if (*cur == '\n') {
 | |
| 		ctxt->input->line++; ctxt->input->col = 1;
 | |
| 	    } else {
 | |
| 		ctxt->input->col++;
 | |
| 	    }
 | |
| 	    cur++;
 | |
| 	    if (res < INT_MAX)
 | |
| 		res++;
 | |
| 	    if (*cur == 0) {
 | |
| 		ctxt->input->cur = cur;
 | |
| 		xmlParserGrow(ctxt);
 | |
| 		cur = ctxt->input->cur;
 | |
| 	    }
 | |
| 	}
 | |
| 	ctxt->input->cur = cur;
 | |
|     } else {
 | |
|         int expandPE = ((ctxt->external != 0) || (ctxt->inputNr != 1));
 | |
| 
 | |
| 	while (ctxt->instate != XML_PARSER_EOF) {
 | |
|             if (IS_BLANK_CH(CUR)) { /* CHECKED tstblanks.xml */
 | |
| 		NEXT;
 | |
| 	    } else if (CUR == '%') {
 | |
|                 /*
 | |
|                  * Need to handle support of entities branching here
 | |
|                  */
 | |
| 	        if ((expandPE == 0) || (IS_BLANK_CH(NXT(1))) || (NXT(1) == 0))
 | |
|                     break;
 | |
| 	        xmlParsePEReference(ctxt);
 | |
|             } else if (CUR == 0) {
 | |
|                 unsigned long consumed;
 | |
|                 xmlEntityPtr ent;
 | |
| 
 | |
|                 if (ctxt->inputNr <= 1)
 | |
|                     break;
 | |
| 
 | |
|                 consumed = ctxt->input->consumed;
 | |
|                 xmlSaturatedAddSizeT(&consumed,
 | |
|                                      ctxt->input->cur - ctxt->input->base);
 | |
| 
 | |
|                 /*
 | |
|                  * Add to sizeentities when parsing an external entity
 | |
|                  * for the first time.
 | |
|                  */
 | |
|                 ent = ctxt->input->entity;
 | |
|                 if ((ent->etype == XML_EXTERNAL_PARAMETER_ENTITY) &&
 | |
|                     ((ent->flags & XML_ENT_PARSED) == 0)) {
 | |
|                     ent->flags |= XML_ENT_PARSED;
 | |
| 
 | |
|                     xmlSaturatedAdd(&ctxt->sizeentities, consumed);
 | |
|                 }
 | |
| 
 | |
|                 xmlParserEntityCheck(ctxt, consumed);
 | |
| 
 | |
|                 xmlPopInput(ctxt);
 | |
|             } else {
 | |
|                 break;
 | |
|             }
 | |
| 
 | |
|             /*
 | |
|              * Also increase the counter when entering or exiting a PERef.
 | |
|              * The spec says: "When a parameter-entity reference is recognized
 | |
|              * in the DTD and included, its replacement text MUST be enlarged
 | |
|              * by the attachment of one leading and one following space (#x20)
 | |
|              * character."
 | |
|              */
 | |
| 	    if (res < INT_MAX)
 | |
| 		res++;
 | |
|         }
 | |
|     }
 | |
|     return(res);
 | |
| }
 | |
| 
 | |
| /************************************************************************
 | |
|  *									*
 | |
|  *		Commodity functions to handle entities			*
 | |
|  *									*
 | |
|  ************************************************************************/
 | |
| 
 | |
| /**
 | |
|  * xmlPopInput:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * xmlPopInput: the current input pointed by ctxt->input came to an end
 | |
|  *          pop it and return the next char.
 | |
|  *
 | |
|  * Returns the current xmlChar in the parser context
 | |
|  */
 | |
| xmlChar
 | |
| xmlPopInput(xmlParserCtxtPtr ctxt) {
 | |
|     xmlParserInputPtr input;
 | |
| 
 | |
|     if ((ctxt == NULL) || (ctxt->inputNr <= 1)) return(0);
 | |
|     if (xmlParserDebugEntities)
 | |
| 	xmlGenericError(xmlGenericErrorContext,
 | |
| 		"Popping input %d\n", ctxt->inputNr);
 | |
|     if ((ctxt->inputNr > 1) && (ctxt->inSubset == 0) &&
 | |
|         (ctxt->instate != XML_PARSER_EOF))
 | |
|         xmlFatalErr(ctxt, XML_ERR_INTERNAL_ERROR,
 | |
|                     "Unfinished entity outside the DTD");
 | |
|     input = inputPop(ctxt);
 | |
|     if (input->entity != NULL)
 | |
|         input->entity->flags &= ~XML_ENT_EXPANDING;
 | |
|     xmlFreeInputStream(input);
 | |
|     if (*ctxt->input->cur == 0)
 | |
|         xmlParserGrow(ctxt);
 | |
|     return(CUR);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlPushInput:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @input:  an XML parser input fragment (entity, XML fragment ...).
 | |
|  *
 | |
|  * xmlPushInput: switch to a new input stream which is stacked on top
 | |
|  *               of the previous one(s).
 | |
|  * Returns -1 in case of error or the index in the input stack
 | |
|  */
 | |
| int
 | |
| xmlPushInput(xmlParserCtxtPtr ctxt, xmlParserInputPtr input) {
 | |
|     int ret;
 | |
|     if (input == NULL) return(-1);
 | |
| 
 | |
|     if (xmlParserDebugEntities) {
 | |
| 	if ((ctxt->input != NULL) && (ctxt->input->filename))
 | |
| 	    xmlGenericError(xmlGenericErrorContext,
 | |
| 		    "%s(%d): ", ctxt->input->filename,
 | |
| 		    ctxt->input->line);
 | |
| 	xmlGenericError(xmlGenericErrorContext,
 | |
| 		"Pushing input %d : %.30s\n", ctxt->inputNr+1, input->cur);
 | |
|     }
 | |
|     if (((ctxt->inputNr > 40) && ((ctxt->options & XML_PARSE_HUGE) == 0)) ||
 | |
|         (ctxt->inputNr > 100)) {
 | |
|         xmlFatalErr(ctxt, XML_ERR_ENTITY_LOOP, NULL);
 | |
|         while (ctxt->inputNr > 1)
 | |
|             xmlFreeInputStream(inputPop(ctxt));
 | |
| 	return(-1);
 | |
|     }
 | |
|     ret = inputPush(ctxt, input);
 | |
|     if (ctxt->instate == XML_PARSER_EOF)
 | |
|         return(-1);
 | |
|     GROW;
 | |
|     return(ret);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseCharRef:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * Parse a numeric character reference. Always consumes '&'.
 | |
|  *
 | |
|  * [66] CharRef ::= '&#' [0-9]+ ';' |
 | |
|  *                  '&#x' [0-9a-fA-F]+ ';'
 | |
|  *
 | |
|  * [ WFC: Legal Character ]
 | |
|  * Characters referred to using character references must match the
 | |
|  * production for Char.
 | |
|  *
 | |
|  * Returns the value parsed (as an int), 0 in case of error
 | |
|  */
 | |
| int
 | |
| xmlParseCharRef(xmlParserCtxtPtr ctxt) {
 | |
|     int val = 0;
 | |
|     int count = 0;
 | |
| 
 | |
|     /*
 | |
|      * Using RAW/CUR/NEXT is okay since we are working on ASCII range here
 | |
|      */
 | |
|     if ((RAW == '&') && (NXT(1) == '#') &&
 | |
|         (NXT(2) == 'x')) {
 | |
| 	SKIP(3);
 | |
| 	GROW;
 | |
| 	while (RAW != ';') { /* loop blocked by count */
 | |
| 	    if (count++ > 20) {
 | |
| 		count = 0;
 | |
| 		GROW;
 | |
|                 if (ctxt->instate == XML_PARSER_EOF)
 | |
|                     return(0);
 | |
| 	    }
 | |
| 	    if ((RAW >= '0') && (RAW <= '9'))
 | |
| 	        val = val * 16 + (CUR - '0');
 | |
| 	    else if ((RAW >= 'a') && (RAW <= 'f') && (count < 20))
 | |
| 	        val = val * 16 + (CUR - 'a') + 10;
 | |
| 	    else if ((RAW >= 'A') && (RAW <= 'F') && (count < 20))
 | |
| 	        val = val * 16 + (CUR - 'A') + 10;
 | |
| 	    else {
 | |
| 		xmlFatalErr(ctxt, XML_ERR_INVALID_HEX_CHARREF, NULL);
 | |
| 		val = 0;
 | |
| 		break;
 | |
| 	    }
 | |
| 	    if (val > 0x110000)
 | |
| 	        val = 0x110000;
 | |
| 
 | |
| 	    NEXT;
 | |
| 	    count++;
 | |
| 	}
 | |
| 	if (RAW == ';') {
 | |
| 	    /* on purpose to avoid reentrancy problems with NEXT and SKIP */
 | |
| 	    ctxt->input->col++;
 | |
| 	    ctxt->input->cur++;
 | |
| 	}
 | |
|     } else if  ((RAW == '&') && (NXT(1) == '#')) {
 | |
| 	SKIP(2);
 | |
| 	GROW;
 | |
| 	while (RAW != ';') { /* loop blocked by count */
 | |
| 	    if (count++ > 20) {
 | |
| 		count = 0;
 | |
| 		GROW;
 | |
|                 if (ctxt->instate == XML_PARSER_EOF)
 | |
|                     return(0);
 | |
| 	    }
 | |
| 	    if ((RAW >= '0') && (RAW <= '9'))
 | |
| 	        val = val * 10 + (CUR - '0');
 | |
| 	    else {
 | |
| 		xmlFatalErr(ctxt, XML_ERR_INVALID_DEC_CHARREF, NULL);
 | |
| 		val = 0;
 | |
| 		break;
 | |
| 	    }
 | |
| 	    if (val > 0x110000)
 | |
| 	        val = 0x110000;
 | |
| 
 | |
| 	    NEXT;
 | |
| 	    count++;
 | |
| 	}
 | |
| 	if (RAW == ';') {
 | |
| 	    /* on purpose to avoid reentrancy problems with NEXT and SKIP */
 | |
| 	    ctxt->input->col++;
 | |
| 	    ctxt->input->cur++;
 | |
| 	}
 | |
|     } else {
 | |
|         if (RAW == '&')
 | |
|             SKIP(1);
 | |
|         xmlFatalErr(ctxt, XML_ERR_INVALID_CHARREF, NULL);
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * [ WFC: Legal Character ]
 | |
|      * Characters referred to using character references must match the
 | |
|      * production for Char.
 | |
|      */
 | |
|     if (val >= 0x110000) {
 | |
|         xmlFatalErrMsgInt(ctxt, XML_ERR_INVALID_CHAR,
 | |
|                 "xmlParseCharRef: character reference out of bounds\n",
 | |
| 	        val);
 | |
|     } else if (IS_CHAR(val)) {
 | |
|         return(val);
 | |
|     } else {
 | |
|         xmlFatalErrMsgInt(ctxt, XML_ERR_INVALID_CHAR,
 | |
|                           "xmlParseCharRef: invalid xmlChar value %d\n",
 | |
| 	                  val);
 | |
|     }
 | |
|     return(0);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseStringCharRef:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @str:  a pointer to an index in the string
 | |
|  *
 | |
|  * parse Reference declarations, variant parsing from a string rather
 | |
|  * than an an input flow.
 | |
|  *
 | |
|  * [66] CharRef ::= '&#' [0-9]+ ';' |
 | |
|  *                  '&#x' [0-9a-fA-F]+ ';'
 | |
|  *
 | |
|  * [ WFC: Legal Character ]
 | |
|  * Characters referred to using character references must match the
 | |
|  * production for Char.
 | |
|  *
 | |
|  * Returns the value parsed (as an int), 0 in case of error, str will be
 | |
|  *         updated to the current value of the index
 | |
|  */
 | |
| static int
 | |
| xmlParseStringCharRef(xmlParserCtxtPtr ctxt, const xmlChar **str) {
 | |
|     const xmlChar *ptr;
 | |
|     xmlChar cur;
 | |
|     int val = 0;
 | |
| 
 | |
|     if ((str == NULL) || (*str == NULL)) return(0);
 | |
|     ptr = *str;
 | |
|     cur = *ptr;
 | |
|     if ((cur == '&') && (ptr[1] == '#') && (ptr[2] == 'x')) {
 | |
| 	ptr += 3;
 | |
| 	cur = *ptr;
 | |
| 	while (cur != ';') { /* Non input consuming loop */
 | |
| 	    if ((cur >= '0') && (cur <= '9'))
 | |
| 	        val = val * 16 + (cur - '0');
 | |
| 	    else if ((cur >= 'a') && (cur <= 'f'))
 | |
| 	        val = val * 16 + (cur - 'a') + 10;
 | |
| 	    else if ((cur >= 'A') && (cur <= 'F'))
 | |
| 	        val = val * 16 + (cur - 'A') + 10;
 | |
| 	    else {
 | |
| 		xmlFatalErr(ctxt, XML_ERR_INVALID_HEX_CHARREF, NULL);
 | |
| 		val = 0;
 | |
| 		break;
 | |
| 	    }
 | |
| 	    if (val > 0x110000)
 | |
| 	        val = 0x110000;
 | |
| 
 | |
| 	    ptr++;
 | |
| 	    cur = *ptr;
 | |
| 	}
 | |
| 	if (cur == ';')
 | |
| 	    ptr++;
 | |
|     } else if  ((cur == '&') && (ptr[1] == '#')){
 | |
| 	ptr += 2;
 | |
| 	cur = *ptr;
 | |
| 	while (cur != ';') { /* Non input consuming loops */
 | |
| 	    if ((cur >= '0') && (cur <= '9'))
 | |
| 	        val = val * 10 + (cur - '0');
 | |
| 	    else {
 | |
| 		xmlFatalErr(ctxt, XML_ERR_INVALID_DEC_CHARREF, NULL);
 | |
| 		val = 0;
 | |
| 		break;
 | |
| 	    }
 | |
| 	    if (val > 0x110000)
 | |
| 	        val = 0x110000;
 | |
| 
 | |
| 	    ptr++;
 | |
| 	    cur = *ptr;
 | |
| 	}
 | |
| 	if (cur == ';')
 | |
| 	    ptr++;
 | |
|     } else {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_INVALID_CHARREF, NULL);
 | |
| 	return(0);
 | |
|     }
 | |
|     *str = ptr;
 | |
| 
 | |
|     /*
 | |
|      * [ WFC: Legal Character ]
 | |
|      * Characters referred to using character references must match the
 | |
|      * production for Char.
 | |
|      */
 | |
|     if (val >= 0x110000) {
 | |
|         xmlFatalErrMsgInt(ctxt, XML_ERR_INVALID_CHAR,
 | |
|                 "xmlParseStringCharRef: character reference out of bounds\n",
 | |
|                 val);
 | |
|     } else if (IS_CHAR(val)) {
 | |
|         return(val);
 | |
|     } else {
 | |
|         xmlFatalErrMsgInt(ctxt, XML_ERR_INVALID_CHAR,
 | |
| 			  "xmlParseStringCharRef: invalid xmlChar value %d\n",
 | |
| 			  val);
 | |
|     }
 | |
|     return(0);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParserHandlePEReference:
 | |
|  * @ctxt:  the parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, do not use.
 | |
|  *
 | |
|  * [69] PEReference ::= '%' Name ';'
 | |
|  *
 | |
|  * [ WFC: No Recursion ]
 | |
|  * A parsed entity must not contain a recursive
 | |
|  * reference to itself, either directly or indirectly.
 | |
|  *
 | |
|  * [ WFC: Entity Declared ]
 | |
|  * In a document without any DTD, a document with only an internal DTD
 | |
|  * subset which contains no parameter entity references, or a document
 | |
|  * with "standalone='yes'", ...  ... The declaration of a parameter
 | |
|  * entity must precede any reference to it...
 | |
|  *
 | |
|  * [ VC: Entity Declared ]
 | |
|  * In a document with an external subset or external parameter entities
 | |
|  * with "standalone='no'", ...  ... The declaration of a parameter entity
 | |
|  * must precede any reference to it...
 | |
|  *
 | |
|  * [ WFC: In DTD ]
 | |
|  * Parameter-entity references may only appear in the DTD.
 | |
|  * NOTE: misleading but this is handled.
 | |
|  *
 | |
|  * A PEReference may have been detected in the current input stream
 | |
|  * the handling is done accordingly to
 | |
|  *      http://www.w3.org/TR/REC-xml#entproc
 | |
|  * i.e.
 | |
|  *   - Included in literal in entity values
 | |
|  *   - Included as Parameter Entity reference within DTDs
 | |
|  */
 | |
| void
 | |
| xmlParserHandlePEReference(xmlParserCtxtPtr ctxt) {
 | |
|     switch(ctxt->instate) {
 | |
| 	case XML_PARSER_CDATA_SECTION:
 | |
| 	    return;
 | |
|         case XML_PARSER_COMMENT:
 | |
| 	    return;
 | |
| 	case XML_PARSER_START_TAG:
 | |
| 	    return;
 | |
| 	case XML_PARSER_END_TAG:
 | |
| 	    return;
 | |
|         case XML_PARSER_EOF:
 | |
| 	    xmlFatalErr(ctxt, XML_ERR_PEREF_AT_EOF, NULL);
 | |
| 	    return;
 | |
|         case XML_PARSER_PROLOG:
 | |
| 	case XML_PARSER_START:
 | |
| 	case XML_PARSER_XML_DECL:
 | |
| 	case XML_PARSER_MISC:
 | |
| 	    xmlFatalErr(ctxt, XML_ERR_PEREF_IN_PROLOG, NULL);
 | |
| 	    return;
 | |
| 	case XML_PARSER_ENTITY_DECL:
 | |
|         case XML_PARSER_CONTENT:
 | |
|         case XML_PARSER_ATTRIBUTE_VALUE:
 | |
|         case XML_PARSER_PI:
 | |
| 	case XML_PARSER_SYSTEM_LITERAL:
 | |
| 	case XML_PARSER_PUBLIC_LITERAL:
 | |
| 	    /* we just ignore it there */
 | |
| 	    return;
 | |
|         case XML_PARSER_EPILOG:
 | |
| 	    xmlFatalErr(ctxt, XML_ERR_PEREF_IN_EPILOG, NULL);
 | |
| 	    return;
 | |
| 	case XML_PARSER_ENTITY_VALUE:
 | |
| 	    /*
 | |
| 	     * NOTE: in the case of entity values, we don't do the
 | |
| 	     *       substitution here since we need the literal
 | |
| 	     *       entity value to be able to save the internal
 | |
| 	     *       subset of the document.
 | |
| 	     *       This will be handled by xmlStringDecodeEntities
 | |
| 	     */
 | |
| 	    return;
 | |
|         case XML_PARSER_DTD:
 | |
| 	    /*
 | |
| 	     * [WFC: Well-Formedness Constraint: PEs in Internal Subset]
 | |
| 	     * In the internal DTD subset, parameter-entity references
 | |
| 	     * can occur only where markup declarations can occur, not
 | |
| 	     * within markup declarations.
 | |
| 	     * In that case this is handled in xmlParseMarkupDecl
 | |
| 	     */
 | |
| 	    if ((ctxt->external == 0) && (ctxt->inputNr == 1))
 | |
| 		return;
 | |
| 	    if (IS_BLANK_CH(NXT(1)) || NXT(1) == 0)
 | |
| 		return;
 | |
|             break;
 | |
|         case XML_PARSER_IGNORE:
 | |
|             return;
 | |
|     }
 | |
| 
 | |
|     xmlParsePEReference(ctxt);
 | |
| }
 | |
| 
 | |
| /*
 | |
|  * Macro used to grow the current buffer.
 | |
|  * buffer##_size is expected to be a size_t
 | |
|  * mem_error: is expected to handle memory allocation failures
 | |
|  */
 | |
| #define growBuffer(buffer, n) {						\
 | |
|     xmlChar *tmp;							\
 | |
|     size_t new_size = buffer##_size * 2 + n;                            \
 | |
|     if (new_size < buffer##_size) goto mem_error;                       \
 | |
|     tmp = (xmlChar *) xmlRealloc(buffer, new_size);                     \
 | |
|     if (tmp == NULL) goto mem_error;					\
 | |
|     buffer = tmp;							\
 | |
|     buffer##_size = new_size;                                           \
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlStringDecodeEntitiesInt:
 | |
|  * @ctxt:  the parser context
 | |
|  * @str:  the input string
 | |
|  * @len: the string length
 | |
|  * @what:  combination of XML_SUBSTITUTE_REF and XML_SUBSTITUTE_PEREF
 | |
|  * @end:  an end marker xmlChar, 0 if none
 | |
|  * @end2:  an end marker xmlChar, 0 if none
 | |
|  * @end3:  an end marker xmlChar, 0 if none
 | |
|  * @check:  whether to perform entity checks
 | |
|  */
 | |
| static xmlChar *
 | |
| xmlStringDecodeEntitiesInt(xmlParserCtxtPtr ctxt, const xmlChar *str, int len,
 | |
| 		           int what, xmlChar end, xmlChar  end2, xmlChar end3,
 | |
|                            int check) {
 | |
|     xmlChar *buffer = NULL;
 | |
|     size_t buffer_size = 0;
 | |
|     size_t nbchars = 0;
 | |
| 
 | |
|     xmlChar *current = NULL;
 | |
|     xmlChar *rep = NULL;
 | |
|     const xmlChar *last;
 | |
|     xmlEntityPtr ent;
 | |
|     int c,l;
 | |
| 
 | |
|     if (str == NULL)
 | |
|         return(NULL);
 | |
|     last = str + len;
 | |
| 
 | |
|     if (((ctxt->depth > 40) &&
 | |
|          ((ctxt->options & XML_PARSE_HUGE) == 0)) ||
 | |
| 	(ctxt->depth > 100)) {
 | |
| 	xmlFatalErrMsg(ctxt, XML_ERR_ENTITY_LOOP,
 | |
|                        "Maximum entity nesting depth exceeded");
 | |
| 	return(NULL);
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * allocate a translation buffer.
 | |
|      */
 | |
|     buffer_size = XML_PARSER_BIG_BUFFER_SIZE;
 | |
|     buffer = (xmlChar *) xmlMallocAtomic(buffer_size);
 | |
|     if (buffer == NULL) goto mem_error;
 | |
| 
 | |
|     /*
 | |
|      * OK loop until we reach one of the ending char or a size limit.
 | |
|      * we are operating on already parsed values.
 | |
|      */
 | |
|     if (str < last)
 | |
| 	c = CUR_SCHAR(str, l);
 | |
|     else
 | |
|         c = 0;
 | |
|     while ((c != 0) && (c != end) && /* non input consuming loop */
 | |
|            (c != end2) && (c != end3) &&
 | |
|            (ctxt->instate != XML_PARSER_EOF)) {
 | |
| 
 | |
| 	if (c == 0) break;
 | |
|         if ((c == '&') && (str[1] == '#')) {
 | |
| 	    int val = xmlParseStringCharRef(ctxt, &str);
 | |
| 	    if (val == 0)
 | |
|                 goto int_error;
 | |
| 	    COPY_BUF(buffer, nbchars, val);
 | |
| 	    if (nbchars + XML_PARSER_BUFFER_SIZE > buffer_size) {
 | |
| 	        growBuffer(buffer, XML_PARSER_BUFFER_SIZE);
 | |
| 	    }
 | |
| 	} else if ((c == '&') && (what & XML_SUBSTITUTE_REF)) {
 | |
| 	    if (xmlParserDebugEntities)
 | |
| 		xmlGenericError(xmlGenericErrorContext,
 | |
| 			"String decoding Entity Reference: %.30s\n",
 | |
| 			str);
 | |
| 	    ent = xmlParseStringEntityRef(ctxt, &str);
 | |
| 	    if ((ent != NULL) &&
 | |
| 		(ent->etype == XML_INTERNAL_PREDEFINED_ENTITY)) {
 | |
| 		if (ent->content != NULL) {
 | |
| 		    COPY_BUF(buffer, nbchars, ent->content[0]);
 | |
| 		    if (nbchars + XML_PARSER_BUFFER_SIZE > buffer_size) {
 | |
| 			growBuffer(buffer, XML_PARSER_BUFFER_SIZE);
 | |
| 		    }
 | |
| 		} else {
 | |
| 		    xmlFatalErrMsg(ctxt, XML_ERR_INTERNAL_ERROR,
 | |
| 			    "predefined entity has no content\n");
 | |
|                     goto int_error;
 | |
| 		}
 | |
| 	    } else if ((ent != NULL) && (ent->content != NULL)) {
 | |
| 	        if ((check) && (xmlParserEntityCheck(ctxt, ent->length)))
 | |
|                     goto int_error;
 | |
| 
 | |
|                 if (ent->flags & XML_ENT_EXPANDING) {
 | |
| 	            xmlFatalErr(ctxt, XML_ERR_ENTITY_LOOP, NULL);
 | |
|                     xmlHaltParser(ctxt);
 | |
|                     ent->content[0] = 0;
 | |
|                     goto int_error;
 | |
|                 }
 | |
| 
 | |
|                 ent->flags |= XML_ENT_EXPANDING;
 | |
| 		ctxt->depth++;
 | |
| 		rep = xmlStringDecodeEntitiesInt(ctxt, ent->content,
 | |
|                         ent->length, what, 0, 0, 0, check);
 | |
| 		ctxt->depth--;
 | |
|                 ent->flags &= ~XML_ENT_EXPANDING;
 | |
| 
 | |
| 		if (rep == NULL) {
 | |
|                     ent->content[0] = 0;
 | |
|                     goto int_error;
 | |
|                 }
 | |
| 
 | |
|                 current = rep;
 | |
|                 while (*current != 0) { /* non input consuming loop */
 | |
|                     buffer[nbchars++] = *current++;
 | |
|                     if (nbchars + XML_PARSER_BUFFER_SIZE > buffer_size) {
 | |
|                         growBuffer(buffer, XML_PARSER_BUFFER_SIZE);
 | |
|                     }
 | |
|                 }
 | |
|                 xmlFree(rep);
 | |
|                 rep = NULL;
 | |
| 	    } else if (ent != NULL) {
 | |
| 		int i = xmlStrlen(ent->name);
 | |
| 		const xmlChar *cur = ent->name;
 | |
| 
 | |
| 		buffer[nbchars++] = '&';
 | |
| 		if (nbchars + i + XML_PARSER_BUFFER_SIZE > buffer_size) {
 | |
| 		    growBuffer(buffer, i + XML_PARSER_BUFFER_SIZE);
 | |
| 		}
 | |
| 		for (;i > 0;i--)
 | |
| 		    buffer[nbchars++] = *cur++;
 | |
| 		buffer[nbchars++] = ';';
 | |
| 	    }
 | |
| 	} else if (c == '%' && (what & XML_SUBSTITUTE_PEREF)) {
 | |
| 	    if (xmlParserDebugEntities)
 | |
| 		xmlGenericError(xmlGenericErrorContext,
 | |
| 			"String decoding PE Reference: %.30s\n", str);
 | |
| 	    ent = xmlParseStringPEReference(ctxt, &str);
 | |
| 	    if (ent != NULL) {
 | |
|                 if (ent->content == NULL) {
 | |
| 		    /*
 | |
| 		     * Note: external parsed entities will not be loaded,
 | |
| 		     * it is not required for a non-validating parser to
 | |
| 		     * complete external PEReferences coming from the
 | |
| 		     * internal subset
 | |
| 		     */
 | |
| 		    if (((ctxt->options & XML_PARSE_NOENT) != 0) ||
 | |
| 			((ctxt->options & XML_PARSE_DTDVALID) != 0) ||
 | |
| 			(ctxt->validate != 0)) {
 | |
| 			xmlLoadEntityContent(ctxt, ent);
 | |
| 		    } else {
 | |
| 			xmlWarningMsg(ctxt, XML_ERR_ENTITY_PROCESSING,
 | |
| 		  "not validating will not read content for PE entity %s\n",
 | |
| 		                      ent->name, NULL);
 | |
| 		    }
 | |
| 		}
 | |
| 
 | |
| 	        if ((check) && (xmlParserEntityCheck(ctxt, ent->length)))
 | |
|                     goto int_error;
 | |
| 
 | |
|                 if (ent->flags & XML_ENT_EXPANDING) {
 | |
| 	            xmlFatalErr(ctxt, XML_ERR_ENTITY_LOOP, NULL);
 | |
|                     xmlHaltParser(ctxt);
 | |
|                     if (ent->content != NULL)
 | |
|                         ent->content[0] = 0;
 | |
|                     goto int_error;
 | |
|                 }
 | |
| 
 | |
|                 ent->flags |= XML_ENT_EXPANDING;
 | |
| 		ctxt->depth++;
 | |
| 		rep = xmlStringDecodeEntitiesInt(ctxt, ent->content,
 | |
|                         ent->length, what, 0, 0, 0, check);
 | |
| 		ctxt->depth--;
 | |
|                 ent->flags &= ~XML_ENT_EXPANDING;
 | |
| 
 | |
| 		if (rep == NULL) {
 | |
|                     if (ent->content != NULL)
 | |
|                         ent->content[0] = 0;
 | |
|                     goto int_error;
 | |
|                 }
 | |
|                 current = rep;
 | |
|                 while (*current != 0) { /* non input consuming loop */
 | |
|                     buffer[nbchars++] = *current++;
 | |
|                     if (nbchars + XML_PARSER_BUFFER_SIZE > buffer_size) {
 | |
|                         growBuffer(buffer, XML_PARSER_BUFFER_SIZE);
 | |
|                     }
 | |
|                 }
 | |
|                 xmlFree(rep);
 | |
|                 rep = NULL;
 | |
| 	    }
 | |
| 	} else {
 | |
| 	    COPY_BUF(buffer, nbchars, c);
 | |
| 	    str += l;
 | |
| 	    if (nbchars + XML_PARSER_BUFFER_SIZE > buffer_size) {
 | |
| 	        growBuffer(buffer, XML_PARSER_BUFFER_SIZE);
 | |
| 	    }
 | |
| 	}
 | |
| 	if (str < last)
 | |
| 	    c = CUR_SCHAR(str, l);
 | |
| 	else
 | |
| 	    c = 0;
 | |
|     }
 | |
|     buffer[nbchars] = 0;
 | |
|     return(buffer);
 | |
| 
 | |
| mem_error:
 | |
|     xmlErrMemory(ctxt, NULL);
 | |
| int_error:
 | |
|     if (rep != NULL)
 | |
|         xmlFree(rep);
 | |
|     if (buffer != NULL)
 | |
|         xmlFree(buffer);
 | |
|     return(NULL);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlStringLenDecodeEntities:
 | |
|  * @ctxt:  the parser context
 | |
|  * @str:  the input string
 | |
|  * @len: the string length
 | |
|  * @what:  combination of XML_SUBSTITUTE_REF and XML_SUBSTITUTE_PEREF
 | |
|  * @end:  an end marker xmlChar, 0 if none
 | |
|  * @end2:  an end marker xmlChar, 0 if none
 | |
|  * @end3:  an end marker xmlChar, 0 if none
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * Takes a entity string content and process to do the adequate substitutions.
 | |
|  *
 | |
|  * [67] Reference ::= EntityRef | CharRef
 | |
|  *
 | |
|  * [69] PEReference ::= '%' Name ';'
 | |
|  *
 | |
|  * Returns A newly allocated string with the substitution done. The caller
 | |
|  *      must deallocate it !
 | |
|  */
 | |
| xmlChar *
 | |
| xmlStringLenDecodeEntities(xmlParserCtxtPtr ctxt, const xmlChar *str, int len,
 | |
|                            int what, xmlChar end, xmlChar  end2,
 | |
|                            xmlChar end3) {
 | |
|     if ((ctxt == NULL) || (str == NULL) || (len < 0))
 | |
|         return(NULL);
 | |
|     return(xmlStringDecodeEntitiesInt(ctxt, str, len, what,
 | |
|                                       end, end2, end3, 0));
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlStringDecodeEntities:
 | |
|  * @ctxt:  the parser context
 | |
|  * @str:  the input string
 | |
|  * @what:  combination of XML_SUBSTITUTE_REF and XML_SUBSTITUTE_PEREF
 | |
|  * @end:  an end marker xmlChar, 0 if none
 | |
|  * @end2:  an end marker xmlChar, 0 if none
 | |
|  * @end3:  an end marker xmlChar, 0 if none
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * Takes a entity string content and process to do the adequate substitutions.
 | |
|  *
 | |
|  * [67] Reference ::= EntityRef | CharRef
 | |
|  *
 | |
|  * [69] PEReference ::= '%' Name ';'
 | |
|  *
 | |
|  * Returns A newly allocated string with the substitution done. The caller
 | |
|  *      must deallocate it !
 | |
|  */
 | |
| xmlChar *
 | |
| xmlStringDecodeEntities(xmlParserCtxtPtr ctxt, const xmlChar *str, int what,
 | |
| 		        xmlChar end, xmlChar  end2, xmlChar end3) {
 | |
|     if ((ctxt == NULL) || (str == NULL)) return(NULL);
 | |
|     return(xmlStringDecodeEntitiesInt(ctxt, str, xmlStrlen(str), what,
 | |
|                                       end, end2, end3, 0));
 | |
| }
 | |
| 
 | |
| /************************************************************************
 | |
|  *									*
 | |
|  *		Commodity functions, cleanup needed ?			*
 | |
|  *									*
 | |
|  ************************************************************************/
 | |
| 
 | |
| /**
 | |
|  * areBlanks:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @str:  a xmlChar *
 | |
|  * @len:  the size of @str
 | |
|  * @blank_chars: we know the chars are blanks
 | |
|  *
 | |
|  * Is this a sequence of blank chars that one can ignore ?
 | |
|  *
 | |
|  * Returns 1 if ignorable 0 otherwise.
 | |
|  */
 | |
| 
 | |
| static int areBlanks(xmlParserCtxtPtr ctxt, const xmlChar *str, int len,
 | |
|                      int blank_chars) {
 | |
|     int i, ret;
 | |
|     xmlNodePtr lastChild;
 | |
| 
 | |
|     /*
 | |
|      * Don't spend time trying to differentiate them, the same callback is
 | |
|      * used !
 | |
|      */
 | |
|     if (ctxt->sax->ignorableWhitespace == ctxt->sax->characters)
 | |
| 	return(0);
 | |
| 
 | |
|     /*
 | |
|      * Check for xml:space value.
 | |
|      */
 | |
|     if ((ctxt->space == NULL) || (*(ctxt->space) == 1) ||
 | |
|         (*(ctxt->space) == -2))
 | |
| 	return(0);
 | |
| 
 | |
|     /*
 | |
|      * Check that the string is made of blanks
 | |
|      */
 | |
|     if (blank_chars == 0) {
 | |
| 	for (i = 0;i < len;i++)
 | |
| 	    if (!(IS_BLANK_CH(str[i]))) return(0);
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * Look if the element is mixed content in the DTD if available
 | |
|      */
 | |
|     if (ctxt->node == NULL) return(0);
 | |
|     if (ctxt->myDoc != NULL) {
 | |
| 	ret = xmlIsMixedElement(ctxt->myDoc, ctxt->node->name);
 | |
|         if (ret == 0) return(1);
 | |
|         if (ret == 1) return(0);
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * Otherwise, heuristic :-\
 | |
|      */
 | |
|     if ((RAW != '<') && (RAW != 0xD)) return(0);
 | |
|     if ((ctxt->node->children == NULL) &&
 | |
| 	(RAW == '<') && (NXT(1) == '/')) return(0);
 | |
| 
 | |
|     lastChild = xmlGetLastChild(ctxt->node);
 | |
|     if (lastChild == NULL) {
 | |
|         if ((ctxt->node->type != XML_ELEMENT_NODE) &&
 | |
|             (ctxt->node->content != NULL)) return(0);
 | |
|     } else if (xmlNodeIsText(lastChild))
 | |
|         return(0);
 | |
|     else if ((ctxt->node->children != NULL) &&
 | |
|              (xmlNodeIsText(ctxt->node->children)))
 | |
|         return(0);
 | |
|     return(1);
 | |
| }
 | |
| 
 | |
| /************************************************************************
 | |
|  *									*
 | |
|  *		Extra stuff for namespace support			*
 | |
|  *	Relates to http://www.w3.org/TR/WD-xml-names			*
 | |
|  *									*
 | |
|  ************************************************************************/
 | |
| 
 | |
| /**
 | |
|  * xmlSplitQName:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @name:  an XML parser context
 | |
|  * @prefix:  a xmlChar **
 | |
|  *
 | |
|  * parse an UTF8 encoded XML qualified name string
 | |
|  *
 | |
|  * [NS 5] QName ::= (Prefix ':')? LocalPart
 | |
|  *
 | |
|  * [NS 6] Prefix ::= NCName
 | |
|  *
 | |
|  * [NS 7] LocalPart ::= NCName
 | |
|  *
 | |
|  * Returns the local part, and prefix is updated
 | |
|  *   to get the Prefix if any.
 | |
|  */
 | |
| 
 | |
| xmlChar *
 | |
| xmlSplitQName(xmlParserCtxtPtr ctxt, const xmlChar *name, xmlChar **prefix) {
 | |
|     xmlChar buf[XML_MAX_NAMELEN + 5];
 | |
|     xmlChar *buffer = NULL;
 | |
|     int len = 0;
 | |
|     int max = XML_MAX_NAMELEN;
 | |
|     xmlChar *ret = NULL;
 | |
|     const xmlChar *cur = name;
 | |
|     int c;
 | |
| 
 | |
|     if (prefix == NULL) return(NULL);
 | |
|     *prefix = NULL;
 | |
| 
 | |
|     if (cur == NULL) return(NULL);
 | |
| 
 | |
| #ifndef XML_XML_NAMESPACE
 | |
|     /* xml: prefix is not really a namespace */
 | |
|     if ((cur[0] == 'x') && (cur[1] == 'm') &&
 | |
|         (cur[2] == 'l') && (cur[3] == ':'))
 | |
| 	return(xmlStrdup(name));
 | |
| #endif
 | |
| 
 | |
|     /* nasty but well=formed */
 | |
|     if (cur[0] == ':')
 | |
| 	return(xmlStrdup(name));
 | |
| 
 | |
|     c = *cur++;
 | |
|     while ((c != 0) && (c != ':') && (len < max)) { /* tested bigname.xml */
 | |
| 	buf[len++] = c;
 | |
| 	c = *cur++;
 | |
|     }
 | |
|     if (len >= max) {
 | |
| 	/*
 | |
| 	 * Okay someone managed to make a huge name, so he's ready to pay
 | |
| 	 * for the processing speed.
 | |
| 	 */
 | |
| 	max = len * 2;
 | |
| 
 | |
| 	buffer = (xmlChar *) xmlMallocAtomic(max);
 | |
| 	if (buffer == NULL) {
 | |
| 	    xmlErrMemory(ctxt, NULL);
 | |
| 	    return(NULL);
 | |
| 	}
 | |
| 	memcpy(buffer, buf, len);
 | |
| 	while ((c != 0) && (c != ':')) { /* tested bigname.xml */
 | |
| 	    if (len + 10 > max) {
 | |
| 	        xmlChar *tmp;
 | |
| 
 | |
| 		max *= 2;
 | |
| 		tmp = (xmlChar *) xmlRealloc(buffer, max);
 | |
| 		if (tmp == NULL) {
 | |
| 		    xmlFree(buffer);
 | |
| 		    xmlErrMemory(ctxt, NULL);
 | |
| 		    return(NULL);
 | |
| 		}
 | |
| 		buffer = tmp;
 | |
| 	    }
 | |
| 	    buffer[len++] = c;
 | |
| 	    c = *cur++;
 | |
| 	}
 | |
| 	buffer[len] = 0;
 | |
|     }
 | |
| 
 | |
|     if ((c == ':') && (*cur == 0)) {
 | |
|         if (buffer != NULL)
 | |
| 	    xmlFree(buffer);
 | |
| 	*prefix = NULL;
 | |
| 	return(xmlStrdup(name));
 | |
|     }
 | |
| 
 | |
|     if (buffer == NULL)
 | |
| 	ret = xmlStrndup(buf, len);
 | |
|     else {
 | |
| 	ret = buffer;
 | |
| 	buffer = NULL;
 | |
| 	max = XML_MAX_NAMELEN;
 | |
|     }
 | |
| 
 | |
| 
 | |
|     if (c == ':') {
 | |
| 	c = *cur;
 | |
|         *prefix = ret;
 | |
| 	if (c == 0) {
 | |
| 	    return(xmlStrndup(BAD_CAST "", 0));
 | |
| 	}
 | |
| 	len = 0;
 | |
| 
 | |
| 	/*
 | |
| 	 * Check that the first character is proper to start
 | |
| 	 * a new name
 | |
| 	 */
 | |
| 	if (!(((c >= 0x61) && (c <= 0x7A)) ||
 | |
| 	      ((c >= 0x41) && (c <= 0x5A)) ||
 | |
| 	      (c == '_') || (c == ':'))) {
 | |
| 	    int l;
 | |
| 	    int first = CUR_SCHAR(cur, l);
 | |
| 
 | |
| 	    if (!IS_LETTER(first) && (first != '_')) {
 | |
| 		xmlFatalErrMsgStr(ctxt, XML_NS_ERR_QNAME,
 | |
| 			    "Name %s is not XML Namespace compliant\n",
 | |
| 				  name);
 | |
| 	    }
 | |
| 	}
 | |
| 	cur++;
 | |
| 
 | |
| 	while ((c != 0) && (len < max)) { /* tested bigname2.xml */
 | |
| 	    buf[len++] = c;
 | |
| 	    c = *cur++;
 | |
| 	}
 | |
| 	if (len >= max) {
 | |
| 	    /*
 | |
| 	     * Okay someone managed to make a huge name, so he's ready to pay
 | |
| 	     * for the processing speed.
 | |
| 	     */
 | |
| 	    max = len * 2;
 | |
| 
 | |
| 	    buffer = (xmlChar *) xmlMallocAtomic(max);
 | |
| 	    if (buffer == NULL) {
 | |
| 	        xmlErrMemory(ctxt, NULL);
 | |
| 		return(NULL);
 | |
| 	    }
 | |
| 	    memcpy(buffer, buf, len);
 | |
| 	    while (c != 0) { /* tested bigname2.xml */
 | |
| 		if (len + 10 > max) {
 | |
| 		    xmlChar *tmp;
 | |
| 
 | |
| 		    max *= 2;
 | |
| 		    tmp = (xmlChar *) xmlRealloc(buffer, max);
 | |
| 		    if (tmp == NULL) {
 | |
| 			xmlErrMemory(ctxt, NULL);
 | |
| 			xmlFree(buffer);
 | |
| 			return(NULL);
 | |
| 		    }
 | |
| 		    buffer = tmp;
 | |
| 		}
 | |
| 		buffer[len++] = c;
 | |
| 		c = *cur++;
 | |
| 	    }
 | |
| 	    buffer[len] = 0;
 | |
| 	}
 | |
| 
 | |
| 	if (buffer == NULL)
 | |
| 	    ret = xmlStrndup(buf, len);
 | |
| 	else {
 | |
| 	    ret = buffer;
 | |
| 	}
 | |
|     }
 | |
| 
 | |
|     return(ret);
 | |
| }
 | |
| 
 | |
| /************************************************************************
 | |
|  *									*
 | |
|  *			The parser itself				*
 | |
|  *	Relates to http://www.w3.org/TR/REC-xml				*
 | |
|  *									*
 | |
|  ************************************************************************/
 | |
| 
 | |
| /************************************************************************
 | |
|  *									*
 | |
|  *	Routines to parse Name, NCName and NmToken			*
 | |
|  *									*
 | |
|  ************************************************************************/
 | |
| 
 | |
| /*
 | |
|  * The two following functions are related to the change of accepted
 | |
|  * characters for Name and NmToken in the Revision 5 of XML-1.0
 | |
|  * They correspond to the modified production [4] and the new production [4a]
 | |
|  * changes in that revision. Also note that the macros used for the
 | |
|  * productions Letter, Digit, CombiningChar and Extender are not needed
 | |
|  * anymore.
 | |
|  * We still keep compatibility to pre-revision5 parsing semantic if the
 | |
|  * new XML_PARSE_OLD10 option is given to the parser.
 | |
|  */
 | |
| static int
 | |
| xmlIsNameStartChar(xmlParserCtxtPtr ctxt, int c) {
 | |
|     if ((ctxt->options & XML_PARSE_OLD10) == 0) {
 | |
|         /*
 | |
| 	 * Use the new checks of production [4] [4a] amd [5] of the
 | |
| 	 * Update 5 of XML-1.0
 | |
| 	 */
 | |
| 	if ((c != ' ') && (c != '>') && (c != '/') && /* accelerators */
 | |
| 	    (((c >= 'a') && (c <= 'z')) ||
 | |
| 	     ((c >= 'A') && (c <= 'Z')) ||
 | |
| 	     (c == '_') || (c == ':') ||
 | |
| 	     ((c >= 0xC0) && (c <= 0xD6)) ||
 | |
| 	     ((c >= 0xD8) && (c <= 0xF6)) ||
 | |
| 	     ((c >= 0xF8) && (c <= 0x2FF)) ||
 | |
| 	     ((c >= 0x370) && (c <= 0x37D)) ||
 | |
| 	     ((c >= 0x37F) && (c <= 0x1FFF)) ||
 | |
| 	     ((c >= 0x200C) && (c <= 0x200D)) ||
 | |
| 	     ((c >= 0x2070) && (c <= 0x218F)) ||
 | |
| 	     ((c >= 0x2C00) && (c <= 0x2FEF)) ||
 | |
| 	     ((c >= 0x3001) && (c <= 0xD7FF)) ||
 | |
| 	     ((c >= 0xF900) && (c <= 0xFDCF)) ||
 | |
| 	     ((c >= 0xFDF0) && (c <= 0xFFFD)) ||
 | |
| 	     ((c >= 0x10000) && (c <= 0xEFFFF))))
 | |
| 	    return(1);
 | |
|     } else {
 | |
|         if (IS_LETTER(c) || (c == '_') || (c == ':'))
 | |
| 	    return(1);
 | |
|     }
 | |
|     return(0);
 | |
| }
 | |
| 
 | |
| static int
 | |
| xmlIsNameChar(xmlParserCtxtPtr ctxt, int c) {
 | |
|     if ((ctxt->options & XML_PARSE_OLD10) == 0) {
 | |
|         /*
 | |
| 	 * Use the new checks of production [4] [4a] amd [5] of the
 | |
| 	 * Update 5 of XML-1.0
 | |
| 	 */
 | |
| 	if ((c != ' ') && (c != '>') && (c != '/') && /* accelerators */
 | |
| 	    (((c >= 'a') && (c <= 'z')) ||
 | |
| 	     ((c >= 'A') && (c <= 'Z')) ||
 | |
| 	     ((c >= '0') && (c <= '9')) || /* !start */
 | |
| 	     (c == '_') || (c == ':') ||
 | |
| 	     (c == '-') || (c == '.') || (c == 0xB7) || /* !start */
 | |
| 	     ((c >= 0xC0) && (c <= 0xD6)) ||
 | |
| 	     ((c >= 0xD8) && (c <= 0xF6)) ||
 | |
| 	     ((c >= 0xF8) && (c <= 0x2FF)) ||
 | |
| 	     ((c >= 0x300) && (c <= 0x36F)) || /* !start */
 | |
| 	     ((c >= 0x370) && (c <= 0x37D)) ||
 | |
| 	     ((c >= 0x37F) && (c <= 0x1FFF)) ||
 | |
| 	     ((c >= 0x200C) && (c <= 0x200D)) ||
 | |
| 	     ((c >= 0x203F) && (c <= 0x2040)) || /* !start */
 | |
| 	     ((c >= 0x2070) && (c <= 0x218F)) ||
 | |
| 	     ((c >= 0x2C00) && (c <= 0x2FEF)) ||
 | |
| 	     ((c >= 0x3001) && (c <= 0xD7FF)) ||
 | |
| 	     ((c >= 0xF900) && (c <= 0xFDCF)) ||
 | |
| 	     ((c >= 0xFDF0) && (c <= 0xFFFD)) ||
 | |
| 	     ((c >= 0x10000) && (c <= 0xEFFFF))))
 | |
| 	     return(1);
 | |
|     } else {
 | |
|         if ((IS_LETTER(c)) || (IS_DIGIT(c)) ||
 | |
|             (c == '.') || (c == '-') ||
 | |
| 	    (c == '_') || (c == ':') ||
 | |
| 	    (IS_COMBINING(c)) ||
 | |
| 	    (IS_EXTENDER(c)))
 | |
| 	    return(1);
 | |
|     }
 | |
|     return(0);
 | |
| }
 | |
| 
 | |
| static xmlChar * xmlParseAttValueInternal(xmlParserCtxtPtr ctxt,
 | |
|                                           int *len, int *alloc, int normalize);
 | |
| 
 | |
| static const xmlChar *
 | |
| xmlParseNameComplex(xmlParserCtxtPtr ctxt) {
 | |
|     int len = 0, l;
 | |
|     int c;
 | |
|     int maxLength = (ctxt->options & XML_PARSE_HUGE) ?
 | |
|                     XML_MAX_TEXT_LENGTH :
 | |
|                     XML_MAX_NAME_LENGTH;
 | |
| 
 | |
|     /*
 | |
|      * Handler for more complex cases
 | |
|      */
 | |
|     c = CUR_CHAR(l);
 | |
|     if ((ctxt->options & XML_PARSE_OLD10) == 0) {
 | |
|         /*
 | |
| 	 * Use the new checks of production [4] [4a] amd [5] of the
 | |
| 	 * Update 5 of XML-1.0
 | |
| 	 */
 | |
| 	if ((c == ' ') || (c == '>') || (c == '/') || /* accelerators */
 | |
| 	    (!(((c >= 'a') && (c <= 'z')) ||
 | |
| 	       ((c >= 'A') && (c <= 'Z')) ||
 | |
| 	       (c == '_') || (c == ':') ||
 | |
| 	       ((c >= 0xC0) && (c <= 0xD6)) ||
 | |
| 	       ((c >= 0xD8) && (c <= 0xF6)) ||
 | |
| 	       ((c >= 0xF8) && (c <= 0x2FF)) ||
 | |
| 	       ((c >= 0x370) && (c <= 0x37D)) ||
 | |
| 	       ((c >= 0x37F) && (c <= 0x1FFF)) ||
 | |
| 	       ((c >= 0x200C) && (c <= 0x200D)) ||
 | |
| 	       ((c >= 0x2070) && (c <= 0x218F)) ||
 | |
| 	       ((c >= 0x2C00) && (c <= 0x2FEF)) ||
 | |
| 	       ((c >= 0x3001) && (c <= 0xD7FF)) ||
 | |
| 	       ((c >= 0xF900) && (c <= 0xFDCF)) ||
 | |
| 	       ((c >= 0xFDF0) && (c <= 0xFFFD)) ||
 | |
| 	       ((c >= 0x10000) && (c <= 0xEFFFF))))) {
 | |
| 	    return(NULL);
 | |
| 	}
 | |
| 	len += l;
 | |
| 	NEXTL(l);
 | |
| 	c = CUR_CHAR(l);
 | |
| 	while ((c != ' ') && (c != '>') && (c != '/') && /* accelerators */
 | |
| 	       (((c >= 'a') && (c <= 'z')) ||
 | |
| 	        ((c >= 'A') && (c <= 'Z')) ||
 | |
| 	        ((c >= '0') && (c <= '9')) || /* !start */
 | |
| 	        (c == '_') || (c == ':') ||
 | |
| 	        (c == '-') || (c == '.') || (c == 0xB7) || /* !start */
 | |
| 	        ((c >= 0xC0) && (c <= 0xD6)) ||
 | |
| 	        ((c >= 0xD8) && (c <= 0xF6)) ||
 | |
| 	        ((c >= 0xF8) && (c <= 0x2FF)) ||
 | |
| 	        ((c >= 0x300) && (c <= 0x36F)) || /* !start */
 | |
| 	        ((c >= 0x370) && (c <= 0x37D)) ||
 | |
| 	        ((c >= 0x37F) && (c <= 0x1FFF)) ||
 | |
| 	        ((c >= 0x200C) && (c <= 0x200D)) ||
 | |
| 	        ((c >= 0x203F) && (c <= 0x2040)) || /* !start */
 | |
| 	        ((c >= 0x2070) && (c <= 0x218F)) ||
 | |
| 	        ((c >= 0x2C00) && (c <= 0x2FEF)) ||
 | |
| 	        ((c >= 0x3001) && (c <= 0xD7FF)) ||
 | |
| 	        ((c >= 0xF900) && (c <= 0xFDCF)) ||
 | |
| 	        ((c >= 0xFDF0) && (c <= 0xFFFD)) ||
 | |
| 	        ((c >= 0x10000) && (c <= 0xEFFFF))
 | |
| 		)) {
 | |
|             if (len <= INT_MAX - l)
 | |
| 	        len += l;
 | |
| 	    NEXTL(l);
 | |
| 	    c = CUR_CHAR(l);
 | |
| 	}
 | |
|     } else {
 | |
| 	if ((c == ' ') || (c == '>') || (c == '/') || /* accelerators */
 | |
| 	    (!IS_LETTER(c) && (c != '_') &&
 | |
| 	     (c != ':'))) {
 | |
| 	    return(NULL);
 | |
| 	}
 | |
| 	len += l;
 | |
| 	NEXTL(l);
 | |
| 	c = CUR_CHAR(l);
 | |
| 
 | |
| 	while ((c != ' ') && (c != '>') && (c != '/') && /* test bigname.xml */
 | |
| 	       ((IS_LETTER(c)) || (IS_DIGIT(c)) ||
 | |
| 		(c == '.') || (c == '-') ||
 | |
| 		(c == '_') || (c == ':') ||
 | |
| 		(IS_COMBINING(c)) ||
 | |
| 		(IS_EXTENDER(c)))) {
 | |
|             if (len <= INT_MAX - l)
 | |
| 	        len += l;
 | |
| 	    NEXTL(l);
 | |
| 	    c = CUR_CHAR(l);
 | |
| 	}
 | |
|     }
 | |
|     if (ctxt->instate == XML_PARSER_EOF)
 | |
|         return(NULL);
 | |
|     if (len > maxLength) {
 | |
|         xmlFatalErr(ctxt, XML_ERR_NAME_TOO_LONG, "Name");
 | |
|         return(NULL);
 | |
|     }
 | |
|     if (ctxt->input->cur - ctxt->input->base < len) {
 | |
|         /*
 | |
|          * There were a couple of bugs where PERefs lead to to a change
 | |
|          * of the buffer. Check the buffer size to avoid passing an invalid
 | |
|          * pointer to xmlDictLookup.
 | |
|          */
 | |
|         xmlFatalErr(ctxt, XML_ERR_INTERNAL_ERROR,
 | |
|                     "unexpected change of input buffer");
 | |
|         return (NULL);
 | |
|     }
 | |
|     if ((*ctxt->input->cur == '\n') && (ctxt->input->cur[-1] == '\r'))
 | |
|         return(xmlDictLookup(ctxt->dict, ctxt->input->cur - (len + 1), len));
 | |
|     return(xmlDictLookup(ctxt->dict, ctxt->input->cur - len, len));
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseName:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * parse an XML name.
 | |
|  *
 | |
|  * [4] NameChar ::= Letter | Digit | '.' | '-' | '_' | ':' |
 | |
|  *                  CombiningChar | Extender
 | |
|  *
 | |
|  * [5] Name ::= (Letter | '_' | ':') (NameChar)*
 | |
|  *
 | |
|  * [6] Names ::= Name (#x20 Name)*
 | |
|  *
 | |
|  * Returns the Name parsed or NULL
 | |
|  */
 | |
| 
 | |
| const xmlChar *
 | |
| xmlParseName(xmlParserCtxtPtr ctxt) {
 | |
|     const xmlChar *in;
 | |
|     const xmlChar *ret;
 | |
|     size_t count = 0;
 | |
|     size_t maxLength = (ctxt->options & XML_PARSE_HUGE) ?
 | |
|                        XML_MAX_TEXT_LENGTH :
 | |
|                        XML_MAX_NAME_LENGTH;
 | |
| 
 | |
|     GROW;
 | |
|     if (ctxt->instate == XML_PARSER_EOF)
 | |
|         return(NULL);
 | |
| 
 | |
|     /*
 | |
|      * Accelerator for simple ASCII names
 | |
|      */
 | |
|     in = ctxt->input->cur;
 | |
|     if (((*in >= 0x61) && (*in <= 0x7A)) ||
 | |
| 	((*in >= 0x41) && (*in <= 0x5A)) ||
 | |
| 	(*in == '_') || (*in == ':')) {
 | |
| 	in++;
 | |
| 	while (((*in >= 0x61) && (*in <= 0x7A)) ||
 | |
| 	       ((*in >= 0x41) && (*in <= 0x5A)) ||
 | |
| 	       ((*in >= 0x30) && (*in <= 0x39)) ||
 | |
| 	       (*in == '_') || (*in == '-') ||
 | |
| 	       (*in == ':') || (*in == '.'))
 | |
| 	    in++;
 | |
| 	if ((*in > 0) && (*in < 0x80)) {
 | |
| 	    count = in - ctxt->input->cur;
 | |
|             if (count > maxLength) {
 | |
|                 xmlFatalErr(ctxt, XML_ERR_NAME_TOO_LONG, "Name");
 | |
|                 return(NULL);
 | |
|             }
 | |
| 	    ret = xmlDictLookup(ctxt->dict, ctxt->input->cur, count);
 | |
| 	    ctxt->input->cur = in;
 | |
| 	    ctxt->input->col += count;
 | |
| 	    if (ret == NULL)
 | |
| 	        xmlErrMemory(ctxt, NULL);
 | |
| 	    return(ret);
 | |
| 	}
 | |
|     }
 | |
|     /* accelerator for special cases */
 | |
|     return(xmlParseNameComplex(ctxt));
 | |
| }
 | |
| 
 | |
| static xmlHashedString
 | |
| xmlParseNCNameComplex(xmlParserCtxtPtr ctxt) {
 | |
|     xmlHashedString ret;
 | |
|     int len = 0, l;
 | |
|     int c;
 | |
|     int maxLength = (ctxt->options & XML_PARSE_HUGE) ?
 | |
|                     XML_MAX_TEXT_LENGTH :
 | |
|                     XML_MAX_NAME_LENGTH;
 | |
|     size_t startPosition = 0;
 | |
| 
 | |
|     ret.name = NULL;
 | |
|     ret.hashValue = 0;
 | |
| 
 | |
|     /*
 | |
|      * Handler for more complex cases
 | |
|      */
 | |
|     startPosition = CUR_PTR - BASE_PTR;
 | |
|     c = CUR_CHAR(l);
 | |
|     if ((c == ' ') || (c == '>') || (c == '/') || /* accelerators */
 | |
| 	(!xmlIsNameStartChar(ctxt, c) || (c == ':'))) {
 | |
| 	return(ret);
 | |
|     }
 | |
| 
 | |
|     while ((c != ' ') && (c != '>') && (c != '/') && /* test bigname.xml */
 | |
| 	   (xmlIsNameChar(ctxt, c) && (c != ':'))) {
 | |
|         if (len <= INT_MAX - l)
 | |
| 	    len += l;
 | |
| 	NEXTL(l);
 | |
| 	c = CUR_CHAR(l);
 | |
|     }
 | |
|     if (ctxt->instate == XML_PARSER_EOF)
 | |
|         return(ret);
 | |
|     if (len > maxLength) {
 | |
|         xmlFatalErr(ctxt, XML_ERR_NAME_TOO_LONG, "NCName");
 | |
|         return(ret);
 | |
|     }
 | |
|     ret = xmlDictLookupHashed(ctxt->dict, (BASE_PTR + startPosition), len);
 | |
|     return(ret);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseNCName:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @len:  length of the string parsed
 | |
|  *
 | |
|  * parse an XML name.
 | |
|  *
 | |
|  * [4NS] NCNameChar ::= Letter | Digit | '.' | '-' | '_' |
 | |
|  *                      CombiningChar | Extender
 | |
|  *
 | |
|  * [5NS] NCName ::= (Letter | '_') (NCNameChar)*
 | |
|  *
 | |
|  * Returns the Name parsed or NULL
 | |
|  */
 | |
| 
 | |
| static xmlHashedString
 | |
| xmlParseNCName(xmlParserCtxtPtr ctxt) {
 | |
|     const xmlChar *in, *e;
 | |
|     xmlHashedString ret;
 | |
|     size_t count = 0;
 | |
|     size_t maxLength = (ctxt->options & XML_PARSE_HUGE) ?
 | |
|                        XML_MAX_TEXT_LENGTH :
 | |
|                        XML_MAX_NAME_LENGTH;
 | |
| 
 | |
|     ret.name = NULL;
 | |
| 
 | |
|     /*
 | |
|      * Accelerator for simple ASCII names
 | |
|      */
 | |
|     in = ctxt->input->cur;
 | |
|     e = ctxt->input->end;
 | |
|     if ((((*in >= 0x61) && (*in <= 0x7A)) ||
 | |
| 	 ((*in >= 0x41) && (*in <= 0x5A)) ||
 | |
| 	 (*in == '_')) && (in < e)) {
 | |
| 	in++;
 | |
| 	while ((((*in >= 0x61) && (*in <= 0x7A)) ||
 | |
| 	        ((*in >= 0x41) && (*in <= 0x5A)) ||
 | |
| 	        ((*in >= 0x30) && (*in <= 0x39)) ||
 | |
| 	        (*in == '_') || (*in == '-') ||
 | |
| 	        (*in == '.')) && (in < e))
 | |
| 	    in++;
 | |
| 	if (in >= e)
 | |
| 	    goto complex;
 | |
| 	if ((*in > 0) && (*in < 0x80)) {
 | |
| 	    count = in - ctxt->input->cur;
 | |
|             if (count > maxLength) {
 | |
|                 xmlFatalErr(ctxt, XML_ERR_NAME_TOO_LONG, "NCName");
 | |
|                 return(ret);
 | |
|             }
 | |
| 	    ret = xmlDictLookupHashed(ctxt->dict, ctxt->input->cur, count);
 | |
| 	    ctxt->input->cur = in;
 | |
| 	    ctxt->input->col += count;
 | |
| 	    if (ret.name == NULL) {
 | |
| 	        xmlErrMemory(ctxt, NULL);
 | |
| 	    }
 | |
| 	    return(ret);
 | |
| 	}
 | |
|     }
 | |
| complex:
 | |
|     return(xmlParseNCNameComplex(ctxt));
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseNameAndCompare:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * parse an XML name and compares for match
 | |
|  * (specialized for endtag parsing)
 | |
|  *
 | |
|  * Returns NULL for an illegal name, (xmlChar*) 1 for success
 | |
|  * and the name for mismatch
 | |
|  */
 | |
| 
 | |
| static const xmlChar *
 | |
| xmlParseNameAndCompare(xmlParserCtxtPtr ctxt, xmlChar const *other) {
 | |
|     register const xmlChar *cmp = other;
 | |
|     register const xmlChar *in;
 | |
|     const xmlChar *ret;
 | |
| 
 | |
|     GROW;
 | |
|     if (ctxt->instate == XML_PARSER_EOF)
 | |
|         return(NULL);
 | |
| 
 | |
|     in = ctxt->input->cur;
 | |
|     while (*in != 0 && *in == *cmp) {
 | |
| 	++in;
 | |
| 	++cmp;
 | |
|     }
 | |
|     if (*cmp == 0 && (*in == '>' || IS_BLANK_CH (*in))) {
 | |
| 	/* success */
 | |
| 	ctxt->input->col += in - ctxt->input->cur;
 | |
| 	ctxt->input->cur = in;
 | |
| 	return (const xmlChar*) 1;
 | |
|     }
 | |
|     /* failure (or end of input buffer), check with full function */
 | |
|     ret = xmlParseName (ctxt);
 | |
|     /* strings coming from the dictionary direct compare possible */
 | |
|     if (ret == other) {
 | |
| 	return (const xmlChar*) 1;
 | |
|     }
 | |
|     return ret;
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseStringName:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @str:  a pointer to the string pointer (IN/OUT)
 | |
|  *
 | |
|  * parse an XML name.
 | |
|  *
 | |
|  * [4] NameChar ::= Letter | Digit | '.' | '-' | '_' | ':' |
 | |
|  *                  CombiningChar | Extender
 | |
|  *
 | |
|  * [5] Name ::= (Letter | '_' | ':') (NameChar)*
 | |
|  *
 | |
|  * [6] Names ::= Name (#x20 Name)*
 | |
|  *
 | |
|  * Returns the Name parsed or NULL. The @str pointer
 | |
|  * is updated to the current location in the string.
 | |
|  */
 | |
| 
 | |
| static xmlChar *
 | |
| xmlParseStringName(xmlParserCtxtPtr ctxt, const xmlChar** str) {
 | |
|     xmlChar buf[XML_MAX_NAMELEN + 5];
 | |
|     const xmlChar *cur = *str;
 | |
|     int len = 0, l;
 | |
|     int c;
 | |
|     int maxLength = (ctxt->options & XML_PARSE_HUGE) ?
 | |
|                     XML_MAX_TEXT_LENGTH :
 | |
|                     XML_MAX_NAME_LENGTH;
 | |
| 
 | |
|     c = CUR_SCHAR(cur, l);
 | |
|     if (!xmlIsNameStartChar(ctxt, c)) {
 | |
| 	return(NULL);
 | |
|     }
 | |
| 
 | |
|     COPY_BUF(buf, len, c);
 | |
|     cur += l;
 | |
|     c = CUR_SCHAR(cur, l);
 | |
|     while (xmlIsNameChar(ctxt, c)) {
 | |
| 	COPY_BUF(buf, len, c);
 | |
| 	cur += l;
 | |
| 	c = CUR_SCHAR(cur, l);
 | |
| 	if (len >= XML_MAX_NAMELEN) { /* test bigentname.xml */
 | |
| 	    /*
 | |
| 	     * Okay someone managed to make a huge name, so he's ready to pay
 | |
| 	     * for the processing speed.
 | |
| 	     */
 | |
| 	    xmlChar *buffer;
 | |
| 	    int max = len * 2;
 | |
| 
 | |
| 	    buffer = (xmlChar *) xmlMallocAtomic(max);
 | |
| 	    if (buffer == NULL) {
 | |
| 	        xmlErrMemory(ctxt, NULL);
 | |
| 		return(NULL);
 | |
| 	    }
 | |
| 	    memcpy(buffer, buf, len);
 | |
| 	    while (xmlIsNameChar(ctxt, c)) {
 | |
| 		if (len + 10 > max) {
 | |
| 		    xmlChar *tmp;
 | |
| 
 | |
| 		    max *= 2;
 | |
| 		    tmp = (xmlChar *) xmlRealloc(buffer, max);
 | |
| 		    if (tmp == NULL) {
 | |
| 			xmlErrMemory(ctxt, NULL);
 | |
| 			xmlFree(buffer);
 | |
| 			return(NULL);
 | |
| 		    }
 | |
| 		    buffer = tmp;
 | |
| 		}
 | |
| 		COPY_BUF(buffer, len, c);
 | |
| 		cur += l;
 | |
| 		c = CUR_SCHAR(cur, l);
 | |
|                 if (len > maxLength) {
 | |
|                     xmlFatalErr(ctxt, XML_ERR_NAME_TOO_LONG, "NCName");
 | |
|                     xmlFree(buffer);
 | |
|                     return(NULL);
 | |
|                 }
 | |
| 	    }
 | |
| 	    buffer[len] = 0;
 | |
| 	    *str = cur;
 | |
| 	    return(buffer);
 | |
| 	}
 | |
|     }
 | |
|     if (len > maxLength) {
 | |
|         xmlFatalErr(ctxt, XML_ERR_NAME_TOO_LONG, "NCName");
 | |
|         return(NULL);
 | |
|     }
 | |
|     *str = cur;
 | |
|     return(xmlStrndup(buf, len));
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseNmtoken:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * parse an XML Nmtoken.
 | |
|  *
 | |
|  * [7] Nmtoken ::= (NameChar)+
 | |
|  *
 | |
|  * [8] Nmtokens ::= Nmtoken (#x20 Nmtoken)*
 | |
|  *
 | |
|  * Returns the Nmtoken parsed or NULL
 | |
|  */
 | |
| 
 | |
| xmlChar *
 | |
| xmlParseNmtoken(xmlParserCtxtPtr ctxt) {
 | |
|     xmlChar buf[XML_MAX_NAMELEN + 5];
 | |
|     int len = 0, l;
 | |
|     int c;
 | |
|     int maxLength = (ctxt->options & XML_PARSE_HUGE) ?
 | |
|                     XML_MAX_TEXT_LENGTH :
 | |
|                     XML_MAX_NAME_LENGTH;
 | |
| 
 | |
|     c = CUR_CHAR(l);
 | |
| 
 | |
|     while (xmlIsNameChar(ctxt, c)) {
 | |
| 	COPY_BUF(buf, len, c);
 | |
| 	NEXTL(l);
 | |
| 	c = CUR_CHAR(l);
 | |
| 	if (len >= XML_MAX_NAMELEN) {
 | |
| 	    /*
 | |
| 	     * Okay someone managed to make a huge token, so he's ready to pay
 | |
| 	     * for the processing speed.
 | |
| 	     */
 | |
| 	    xmlChar *buffer;
 | |
| 	    int max = len * 2;
 | |
| 
 | |
| 	    buffer = (xmlChar *) xmlMallocAtomic(max);
 | |
| 	    if (buffer == NULL) {
 | |
| 	        xmlErrMemory(ctxt, NULL);
 | |
| 		return(NULL);
 | |
| 	    }
 | |
| 	    memcpy(buffer, buf, len);
 | |
| 	    while (xmlIsNameChar(ctxt, c)) {
 | |
| 		if (len + 10 > max) {
 | |
| 		    xmlChar *tmp;
 | |
| 
 | |
| 		    max *= 2;
 | |
| 		    tmp = (xmlChar *) xmlRealloc(buffer, max);
 | |
| 		    if (tmp == NULL) {
 | |
| 			xmlErrMemory(ctxt, NULL);
 | |
| 			xmlFree(buffer);
 | |
| 			return(NULL);
 | |
| 		    }
 | |
| 		    buffer = tmp;
 | |
| 		}
 | |
| 		COPY_BUF(buffer, len, c);
 | |
|                 if (len > maxLength) {
 | |
|                     xmlFatalErr(ctxt, XML_ERR_NAME_TOO_LONG, "NmToken");
 | |
|                     xmlFree(buffer);
 | |
|                     return(NULL);
 | |
|                 }
 | |
| 		NEXTL(l);
 | |
| 		c = CUR_CHAR(l);
 | |
| 	    }
 | |
| 	    buffer[len] = 0;
 | |
|             if (ctxt->instate == XML_PARSER_EOF) {
 | |
|                 xmlFree(buffer);
 | |
|                 return(NULL);
 | |
|             }
 | |
| 	    return(buffer);
 | |
| 	}
 | |
|     }
 | |
|     if (ctxt->instate == XML_PARSER_EOF)
 | |
|         return(NULL);
 | |
|     if (len == 0)
 | |
|         return(NULL);
 | |
|     if (len > maxLength) {
 | |
|         xmlFatalErr(ctxt, XML_ERR_NAME_TOO_LONG, "NmToken");
 | |
|         return(NULL);
 | |
|     }
 | |
|     return(xmlStrndup(buf, len));
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseEntityValue:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @orig:  if non-NULL store a copy of the original entity value
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * parse a value for ENTITY declarations
 | |
|  *
 | |
|  * [9] EntityValue ::= '"' ([^%&"] | PEReference | Reference)* '"' |
 | |
|  *	               "'" ([^%&'] | PEReference | Reference)* "'"
 | |
|  *
 | |
|  * Returns the EntityValue parsed with reference substituted or NULL
 | |
|  */
 | |
| 
 | |
| xmlChar *
 | |
| xmlParseEntityValue(xmlParserCtxtPtr ctxt, xmlChar **orig) {
 | |
|     xmlChar *buf = NULL;
 | |
|     int len = 0;
 | |
|     int size = XML_PARSER_BUFFER_SIZE;
 | |
|     int c, l;
 | |
|     int maxLength = (ctxt->options & XML_PARSE_HUGE) ?
 | |
|                     XML_MAX_HUGE_LENGTH :
 | |
|                     XML_MAX_TEXT_LENGTH;
 | |
|     xmlChar stop;
 | |
|     xmlChar *ret = NULL;
 | |
|     const xmlChar *cur = NULL;
 | |
|     xmlParserInputPtr input;
 | |
| 
 | |
|     if (RAW == '"') stop = '"';
 | |
|     else if (RAW == '\'') stop = '\'';
 | |
|     else {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_ENTITY_NOT_STARTED, NULL);
 | |
| 	return(NULL);
 | |
|     }
 | |
|     buf = (xmlChar *) xmlMallocAtomic(size);
 | |
|     if (buf == NULL) {
 | |
| 	xmlErrMemory(ctxt, NULL);
 | |
| 	return(NULL);
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * The content of the entity definition is copied in a buffer.
 | |
|      */
 | |
| 
 | |
|     ctxt->instate = XML_PARSER_ENTITY_VALUE;
 | |
|     input = ctxt->input;
 | |
|     GROW;
 | |
|     if (ctxt->instate == XML_PARSER_EOF)
 | |
|         goto error;
 | |
|     NEXT;
 | |
|     c = CUR_CHAR(l);
 | |
|     /*
 | |
|      * NOTE: 4.4.5 Included in Literal
 | |
|      * When a parameter entity reference appears in a literal entity
 | |
|      * value, ... a single or double quote character in the replacement
 | |
|      * text is always treated as a normal data character and will not
 | |
|      * terminate the literal.
 | |
|      * In practice it means we stop the loop only when back at parsing
 | |
|      * the initial entity and the quote is found
 | |
|      */
 | |
|     while (((IS_CHAR(c)) && ((c != stop) || /* checked */
 | |
| 	    (ctxt->input != input))) && (ctxt->instate != XML_PARSER_EOF)) {
 | |
| 	if (len + 5 >= size) {
 | |
| 	    xmlChar *tmp;
 | |
| 
 | |
| 	    size *= 2;
 | |
| 	    tmp = (xmlChar *) xmlRealloc(buf, size);
 | |
| 	    if (tmp == NULL) {
 | |
| 		xmlErrMemory(ctxt, NULL);
 | |
|                 goto error;
 | |
| 	    }
 | |
| 	    buf = tmp;
 | |
| 	}
 | |
| 	COPY_BUF(buf, len, c);
 | |
| 	NEXTL(l);
 | |
| 
 | |
| 	GROW;
 | |
| 	c = CUR_CHAR(l);
 | |
| 	if (c == 0) {
 | |
| 	    GROW;
 | |
| 	    c = CUR_CHAR(l);
 | |
| 	}
 | |
| 
 | |
|         if (len > maxLength) {
 | |
|             xmlFatalErrMsg(ctxt, XML_ERR_ENTITY_NOT_FINISHED,
 | |
|                            "entity value too long\n");
 | |
|             goto error;
 | |
|         }
 | |
|     }
 | |
|     buf[len] = 0;
 | |
|     if (ctxt->instate == XML_PARSER_EOF)
 | |
|         goto error;
 | |
|     if (c != stop) {
 | |
|         xmlFatalErr(ctxt, XML_ERR_ENTITY_NOT_FINISHED, NULL);
 | |
|         goto error;
 | |
|     }
 | |
|     NEXT;
 | |
| 
 | |
|     /*
 | |
|      * Raise problem w.r.t. '&' and '%' being used in non-entities
 | |
|      * reference constructs. Note Charref will be handled in
 | |
|      * xmlStringDecodeEntities()
 | |
|      */
 | |
|     cur = buf;
 | |
|     while (*cur != 0) { /* non input consuming */
 | |
| 	if ((*cur == '%') || ((*cur == '&') && (cur[1] != '#'))) {
 | |
| 	    xmlChar *name;
 | |
| 	    xmlChar tmp = *cur;
 | |
|             int nameOk = 0;
 | |
| 
 | |
| 	    cur++;
 | |
| 	    name = xmlParseStringName(ctxt, &cur);
 | |
|             if (name != NULL) {
 | |
|                 nameOk = 1;
 | |
|                 xmlFree(name);
 | |
|             }
 | |
|             if ((nameOk == 0) || (*cur != ';')) {
 | |
| 		xmlFatalErrMsgInt(ctxt, XML_ERR_ENTITY_CHAR_ERROR,
 | |
| 	    "EntityValue: '%c' forbidden except for entities references\n",
 | |
| 	                          tmp);
 | |
|                 goto error;
 | |
| 	    }
 | |
| 	    if ((tmp == '%') && (ctxt->inSubset == 1) &&
 | |
| 		(ctxt->inputNr == 1)) {
 | |
| 		xmlFatalErr(ctxt, XML_ERR_ENTITY_PE_INTERNAL, NULL);
 | |
|                 goto error;
 | |
| 	    }
 | |
| 	    if (*cur == 0)
 | |
| 	        break;
 | |
| 	}
 | |
| 	cur++;
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * Then PEReference entities are substituted.
 | |
|      *
 | |
|      * NOTE: 4.4.7 Bypassed
 | |
|      * When a general entity reference appears in the EntityValue in
 | |
|      * an entity declaration, it is bypassed and left as is.
 | |
|      * so XML_SUBSTITUTE_REF is not set here.
 | |
|      */
 | |
|     ++ctxt->depth;
 | |
|     ret = xmlStringDecodeEntitiesInt(ctxt, buf, len, XML_SUBSTITUTE_PEREF,
 | |
|                                      0, 0, 0, /* check */ 1);
 | |
|     --ctxt->depth;
 | |
| 
 | |
|     if (orig != NULL) {
 | |
|         *orig = buf;
 | |
|         buf = NULL;
 | |
|     }
 | |
| 
 | |
| error:
 | |
|     if (buf != NULL)
 | |
|         xmlFree(buf);
 | |
|     return(ret);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseAttValueComplex:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @len:   the resulting attribute len
 | |
|  * @normalize:  whether to apply the inner normalization
 | |
|  *
 | |
|  * parse a value for an attribute, this is the fallback function
 | |
|  * of xmlParseAttValue() when the attribute parsing requires handling
 | |
|  * of non-ASCII characters, or normalization compaction.
 | |
|  *
 | |
|  * Returns the AttValue parsed or NULL. The value has to be freed by the caller.
 | |
|  */
 | |
| static xmlChar *
 | |
| xmlParseAttValueComplex(xmlParserCtxtPtr ctxt, int *attlen, int normalize) {
 | |
|     xmlChar limit = 0;
 | |
|     xmlChar *buf = NULL;
 | |
|     xmlChar *rep = NULL;
 | |
|     size_t len = 0;
 | |
|     size_t buf_size = 0;
 | |
|     size_t maxLength = (ctxt->options & XML_PARSE_HUGE) ?
 | |
|                        XML_MAX_HUGE_LENGTH :
 | |
|                        XML_MAX_TEXT_LENGTH;
 | |
|     int c, l, in_space = 0;
 | |
|     xmlChar *current = NULL;
 | |
|     xmlEntityPtr ent;
 | |
| 
 | |
|     if (NXT(0) == '"') {
 | |
| 	ctxt->instate = XML_PARSER_ATTRIBUTE_VALUE;
 | |
| 	limit = '"';
 | |
|         NEXT;
 | |
|     } else if (NXT(0) == '\'') {
 | |
| 	limit = '\'';
 | |
| 	ctxt->instate = XML_PARSER_ATTRIBUTE_VALUE;
 | |
|         NEXT;
 | |
|     } else {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_ATTRIBUTE_NOT_STARTED, NULL);
 | |
| 	return(NULL);
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * allocate a translation buffer.
 | |
|      */
 | |
|     buf_size = XML_PARSER_BUFFER_SIZE;
 | |
|     buf = (xmlChar *) xmlMallocAtomic(buf_size);
 | |
|     if (buf == NULL) goto mem_error;
 | |
| 
 | |
|     /*
 | |
|      * OK loop until we reach one of the ending char or a size limit.
 | |
|      */
 | |
|     c = CUR_CHAR(l);
 | |
|     while (((NXT(0) != limit) && /* checked */
 | |
|             (IS_CHAR(c)) && (c != '<')) &&
 | |
|             (ctxt->instate != XML_PARSER_EOF)) {
 | |
| 	if (c == '&') {
 | |
| 	    in_space = 0;
 | |
| 	    if (NXT(1) == '#') {
 | |
| 		int val = xmlParseCharRef(ctxt);
 | |
| 
 | |
| 		if (val == '&') {
 | |
| 		    if (ctxt->replaceEntities) {
 | |
| 			if (len + 10 > buf_size) {
 | |
| 			    growBuffer(buf, 10);
 | |
| 			}
 | |
| 			buf[len++] = '&';
 | |
| 		    } else {
 | |
| 			/*
 | |
| 			 * The reparsing will be done in xmlStringGetNodeList()
 | |
| 			 * called by the attribute() function in SAX.c
 | |
| 			 */
 | |
| 			if (len + 10 > buf_size) {
 | |
| 			    growBuffer(buf, 10);
 | |
| 			}
 | |
| 			buf[len++] = '&';
 | |
| 			buf[len++] = '#';
 | |
| 			buf[len++] = '3';
 | |
| 			buf[len++] = '8';
 | |
| 			buf[len++] = ';';
 | |
| 		    }
 | |
| 		} else if (val != 0) {
 | |
| 		    if (len + 10 > buf_size) {
 | |
| 			growBuffer(buf, 10);
 | |
| 		    }
 | |
| 		    len += xmlCopyChar(0, &buf[len], val);
 | |
| 		}
 | |
| 	    } else {
 | |
| 		ent = xmlParseEntityRef(ctxt);
 | |
| 		if ((ent != NULL) &&
 | |
| 		    (ent->etype == XML_INTERNAL_PREDEFINED_ENTITY)) {
 | |
| 		    if (len + 10 > buf_size) {
 | |
| 			growBuffer(buf, 10);
 | |
| 		    }
 | |
| 		    if ((ctxt->replaceEntities == 0) &&
 | |
| 		        (ent->content[0] == '&')) {
 | |
| 			buf[len++] = '&';
 | |
| 			buf[len++] = '#';
 | |
| 			buf[len++] = '3';
 | |
| 			buf[len++] = '8';
 | |
| 			buf[len++] = ';';
 | |
| 		    } else {
 | |
| 			buf[len++] = ent->content[0];
 | |
| 		    }
 | |
| 		} else if ((ent != NULL) &&
 | |
| 		           (ctxt->replaceEntities != 0)) {
 | |
| 		    if (ent->etype != XML_INTERNAL_PREDEFINED_ENTITY) {
 | |
|                         if (xmlParserEntityCheck(ctxt, ent->length))
 | |
|                             goto error;
 | |
| 
 | |
| 			++ctxt->depth;
 | |
| 			rep = xmlStringDecodeEntitiesInt(ctxt, ent->content,
 | |
|                                 ent->length, XML_SUBSTITUTE_REF, 0, 0, 0,
 | |
|                                 /* check */ 1);
 | |
| 			--ctxt->depth;
 | |
| 			if (rep != NULL) {
 | |
| 			    current = rep;
 | |
| 			    while (*current != 0) { /* non input consuming */
 | |
|                                 if ((*current == 0xD) || (*current == 0xA) ||
 | |
|                                     (*current == 0x9)) {
 | |
|                                     buf[len++] = 0x20;
 | |
|                                     current++;
 | |
|                                 } else
 | |
|                                     buf[len++] = *current++;
 | |
| 				if (len + 10 > buf_size) {
 | |
| 				    growBuffer(buf, 10);
 | |
| 				}
 | |
| 			    }
 | |
| 			    xmlFree(rep);
 | |
| 			    rep = NULL;
 | |
| 			}
 | |
| 		    } else {
 | |
| 			if (len + 10 > buf_size) {
 | |
| 			    growBuffer(buf, 10);
 | |
| 			}
 | |
| 			if (ent->content != NULL)
 | |
| 			    buf[len++] = ent->content[0];
 | |
| 		    }
 | |
| 		} else if (ent != NULL) {
 | |
| 		    int i = xmlStrlen(ent->name);
 | |
| 		    const xmlChar *cur = ent->name;
 | |
| 
 | |
| 		    /*
 | |
|                      * We also check for recursion and amplification
 | |
|                      * when entities are not substituted. They're
 | |
|                      * often expanded later.
 | |
| 		     */
 | |
| 		    if ((ent->etype != XML_INTERNAL_PREDEFINED_ENTITY) &&
 | |
| 			(ent->content != NULL)) {
 | |
|                         if ((ent->flags & XML_ENT_CHECKED) == 0) {
 | |
|                             unsigned long oldCopy = ctxt->sizeentcopy;
 | |
| 
 | |
|                             ctxt->sizeentcopy = ent->length;
 | |
| 
 | |
|                             ++ctxt->depth;
 | |
|                             rep = xmlStringDecodeEntitiesInt(ctxt,
 | |
|                                     ent->content, ent->length,
 | |
|                                     XML_SUBSTITUTE_REF, 0, 0, 0,
 | |
|                                     /* check */ 1);
 | |
|                             --ctxt->depth;
 | |
| 
 | |
|                             /*
 | |
|                              * If we're parsing DTD content, the entity
 | |
|                              * might reference other entities which
 | |
|                              * weren't defined yet, so the check isn't
 | |
|                              * reliable.
 | |
|                              */
 | |
|                             if (ctxt->inSubset == 0) {
 | |
|                                 ent->flags |= XML_ENT_CHECKED;
 | |
|                                 ent->expandedSize = ctxt->sizeentcopy;
 | |
|                             }
 | |
| 
 | |
|                             if (rep != NULL) {
 | |
|                                 xmlFree(rep);
 | |
|                                 rep = NULL;
 | |
|                             } else {
 | |
|                                 ent->content[0] = 0;
 | |
|                             }
 | |
| 
 | |
|                             if (xmlParserEntityCheck(ctxt, oldCopy))
 | |
|                                 goto error;
 | |
|                         } else {
 | |
|                             if (xmlParserEntityCheck(ctxt, ent->expandedSize))
 | |
|                                 goto error;
 | |
|                         }
 | |
| 		    }
 | |
| 
 | |
| 		    /*
 | |
| 		     * Just output the reference
 | |
| 		     */
 | |
| 		    buf[len++] = '&';
 | |
| 		    while (len + i + 10 > buf_size) {
 | |
| 			growBuffer(buf, i + 10);
 | |
| 		    }
 | |
| 		    for (;i > 0;i--)
 | |
| 			buf[len++] = *cur++;
 | |
| 		    buf[len++] = ';';
 | |
| 		}
 | |
| 	    }
 | |
| 	} else {
 | |
| 	    if ((c == 0x20) || (c == 0xD) || (c == 0xA) || (c == 0x9)) {
 | |
| 	        if ((len != 0) || (!normalize)) {
 | |
| 		    if ((!normalize) || (!in_space)) {
 | |
| 			COPY_BUF(buf, len, 0x20);
 | |
| 			while (len + 10 > buf_size) {
 | |
| 			    growBuffer(buf, 10);
 | |
| 			}
 | |
| 		    }
 | |
| 		    in_space = 1;
 | |
| 		}
 | |
| 	    } else {
 | |
| 	        in_space = 0;
 | |
| 		COPY_BUF(buf, len, c);
 | |
| 		if (len + 10 > buf_size) {
 | |
| 		    growBuffer(buf, 10);
 | |
| 		}
 | |
| 	    }
 | |
| 	    NEXTL(l);
 | |
| 	}
 | |
| 	GROW;
 | |
| 	c = CUR_CHAR(l);
 | |
|         if (len > maxLength) {
 | |
|             xmlFatalErrMsg(ctxt, XML_ERR_ATTRIBUTE_NOT_FINISHED,
 | |
|                            "AttValue length too long\n");
 | |
|             goto mem_error;
 | |
|         }
 | |
|     }
 | |
|     if (ctxt->instate == XML_PARSER_EOF)
 | |
|         goto error;
 | |
| 
 | |
|     if ((in_space) && (normalize)) {
 | |
|         while ((len > 0) && (buf[len - 1] == 0x20)) len--;
 | |
|     }
 | |
|     buf[len] = 0;
 | |
|     if (RAW == '<') {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_LT_IN_ATTRIBUTE, NULL);
 | |
|     } else if (RAW != limit) {
 | |
| 	if ((c != 0) && (!IS_CHAR(c))) {
 | |
| 	    xmlFatalErrMsg(ctxt, XML_ERR_INVALID_CHAR,
 | |
| 			   "invalid character in attribute value\n");
 | |
| 	} else {
 | |
| 	    xmlFatalErrMsg(ctxt, XML_ERR_ATTRIBUTE_NOT_FINISHED,
 | |
| 			   "AttValue: ' expected\n");
 | |
|         }
 | |
|     } else
 | |
| 	NEXT;
 | |
| 
 | |
|     if (attlen != NULL) *attlen = len;
 | |
|     return(buf);
 | |
| 
 | |
| mem_error:
 | |
|     xmlErrMemory(ctxt, NULL);
 | |
| error:
 | |
|     if (buf != NULL)
 | |
|         xmlFree(buf);
 | |
|     if (rep != NULL)
 | |
|         xmlFree(rep);
 | |
|     return(NULL);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseAttValue:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * parse a value for an attribute
 | |
|  * Note: the parser won't do substitution of entities here, this
 | |
|  * will be handled later in xmlStringGetNodeList
 | |
|  *
 | |
|  * [10] AttValue ::= '"' ([^<&"] | Reference)* '"' |
 | |
|  *                   "'" ([^<&'] | Reference)* "'"
 | |
|  *
 | |
|  * 3.3.3 Attribute-Value Normalization:
 | |
|  * Before the value of an attribute is passed to the application or
 | |
|  * checked for validity, the XML processor must normalize it as follows:
 | |
|  * - a character reference is processed by appending the referenced
 | |
|  *   character to the attribute value
 | |
|  * - an entity reference is processed by recursively processing the
 | |
|  *   replacement text of the entity
 | |
|  * - a whitespace character (#x20, #xD, #xA, #x9) is processed by
 | |
|  *   appending #x20 to the normalized value, except that only a single
 | |
|  *   #x20 is appended for a "#xD#xA" sequence that is part of an external
 | |
|  *   parsed entity or the literal entity value of an internal parsed entity
 | |
|  * - other characters are processed by appending them to the normalized value
 | |
|  * If the declared value is not CDATA, then the XML processor must further
 | |
|  * process the normalized attribute value by discarding any leading and
 | |
|  * trailing space (#x20) characters, and by replacing sequences of space
 | |
|  * (#x20) characters by a single space (#x20) character.
 | |
|  * All attributes for which no declaration has been read should be treated
 | |
|  * by a non-validating parser as if declared CDATA.
 | |
|  *
 | |
|  * Returns the AttValue parsed or NULL. The value has to be freed by the caller.
 | |
|  */
 | |
| 
 | |
| 
 | |
| xmlChar *
 | |
| xmlParseAttValue(xmlParserCtxtPtr ctxt) {
 | |
|     if ((ctxt == NULL) || (ctxt->input == NULL)) return(NULL);
 | |
|     return(xmlParseAttValueInternal(ctxt, NULL, NULL, 0));
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseSystemLiteral:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * parse an XML Literal
 | |
|  *
 | |
|  * [11] SystemLiteral ::= ('"' [^"]* '"') | ("'" [^']* "'")
 | |
|  *
 | |
|  * Returns the SystemLiteral parsed or NULL
 | |
|  */
 | |
| 
 | |
| xmlChar *
 | |
| xmlParseSystemLiteral(xmlParserCtxtPtr ctxt) {
 | |
|     xmlChar *buf = NULL;
 | |
|     int len = 0;
 | |
|     int size = XML_PARSER_BUFFER_SIZE;
 | |
|     int cur, l;
 | |
|     int maxLength = (ctxt->options & XML_PARSE_HUGE) ?
 | |
|                     XML_MAX_TEXT_LENGTH :
 | |
|                     XML_MAX_NAME_LENGTH;
 | |
|     xmlChar stop;
 | |
|     int state = ctxt->instate;
 | |
| 
 | |
|     if (RAW == '"') {
 | |
|         NEXT;
 | |
| 	stop = '"';
 | |
|     } else if (RAW == '\'') {
 | |
|         NEXT;
 | |
| 	stop = '\'';
 | |
|     } else {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_LITERAL_NOT_STARTED, NULL);
 | |
| 	return(NULL);
 | |
|     }
 | |
| 
 | |
|     buf = (xmlChar *) xmlMallocAtomic(size);
 | |
|     if (buf == NULL) {
 | |
|         xmlErrMemory(ctxt, NULL);
 | |
| 	return(NULL);
 | |
|     }
 | |
|     ctxt->instate = XML_PARSER_SYSTEM_LITERAL;
 | |
|     cur = CUR_CHAR(l);
 | |
|     while ((IS_CHAR(cur)) && (cur != stop)) { /* checked */
 | |
| 	if (len + 5 >= size) {
 | |
| 	    xmlChar *tmp;
 | |
| 
 | |
| 	    size *= 2;
 | |
| 	    tmp = (xmlChar *) xmlRealloc(buf, size);
 | |
| 	    if (tmp == NULL) {
 | |
| 	        xmlFree(buf);
 | |
| 		xmlErrMemory(ctxt, NULL);
 | |
| 		ctxt->instate = (xmlParserInputState) state;
 | |
| 		return(NULL);
 | |
| 	    }
 | |
| 	    buf = tmp;
 | |
| 	}
 | |
| 	COPY_BUF(buf, len, cur);
 | |
|         if (len > maxLength) {
 | |
|             xmlFatalErr(ctxt, XML_ERR_NAME_TOO_LONG, "SystemLiteral");
 | |
|             xmlFree(buf);
 | |
|             ctxt->instate = (xmlParserInputState) state;
 | |
|             return(NULL);
 | |
|         }
 | |
| 	NEXTL(l);
 | |
| 	cur = CUR_CHAR(l);
 | |
|     }
 | |
|     buf[len] = 0;
 | |
|     if (ctxt->instate == XML_PARSER_EOF) {
 | |
|         xmlFree(buf);
 | |
|         return(NULL);
 | |
|     }
 | |
|     ctxt->instate = (xmlParserInputState) state;
 | |
|     if (!IS_CHAR(cur)) {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_LITERAL_NOT_FINISHED, NULL);
 | |
|     } else {
 | |
| 	NEXT;
 | |
|     }
 | |
|     return(buf);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParsePubidLiteral:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * parse an XML public literal
 | |
|  *
 | |
|  * [12] PubidLiteral ::= '"' PubidChar* '"' | "'" (PubidChar - "'")* "'"
 | |
|  *
 | |
|  * Returns the PubidLiteral parsed or NULL.
 | |
|  */
 | |
| 
 | |
| xmlChar *
 | |
| xmlParsePubidLiteral(xmlParserCtxtPtr ctxt) {
 | |
|     xmlChar *buf = NULL;
 | |
|     int len = 0;
 | |
|     int size = XML_PARSER_BUFFER_SIZE;
 | |
|     int maxLength = (ctxt->options & XML_PARSE_HUGE) ?
 | |
|                     XML_MAX_TEXT_LENGTH :
 | |
|                     XML_MAX_NAME_LENGTH;
 | |
|     xmlChar cur;
 | |
|     xmlChar stop;
 | |
|     xmlParserInputState oldstate = ctxt->instate;
 | |
| 
 | |
|     if (RAW == '"') {
 | |
|         NEXT;
 | |
| 	stop = '"';
 | |
|     } else if (RAW == '\'') {
 | |
|         NEXT;
 | |
| 	stop = '\'';
 | |
|     } else {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_LITERAL_NOT_STARTED, NULL);
 | |
| 	return(NULL);
 | |
|     }
 | |
|     buf = (xmlChar *) xmlMallocAtomic(size);
 | |
|     if (buf == NULL) {
 | |
| 	xmlErrMemory(ctxt, NULL);
 | |
| 	return(NULL);
 | |
|     }
 | |
|     ctxt->instate = XML_PARSER_PUBLIC_LITERAL;
 | |
|     cur = CUR;
 | |
|     while ((IS_PUBIDCHAR_CH(cur)) && (cur != stop)) { /* checked */
 | |
| 	if (len + 1 >= size) {
 | |
| 	    xmlChar *tmp;
 | |
| 
 | |
| 	    size *= 2;
 | |
| 	    tmp = (xmlChar *) xmlRealloc(buf, size);
 | |
| 	    if (tmp == NULL) {
 | |
| 		xmlErrMemory(ctxt, NULL);
 | |
| 		xmlFree(buf);
 | |
| 		return(NULL);
 | |
| 	    }
 | |
| 	    buf = tmp;
 | |
| 	}
 | |
| 	buf[len++] = cur;
 | |
|         if (len > maxLength) {
 | |
|             xmlFatalErr(ctxt, XML_ERR_NAME_TOO_LONG, "Public ID");
 | |
|             xmlFree(buf);
 | |
|             return(NULL);
 | |
|         }
 | |
| 	NEXT;
 | |
| 	cur = CUR;
 | |
|     }
 | |
|     buf[len] = 0;
 | |
|     if (ctxt->instate == XML_PARSER_EOF) {
 | |
|         xmlFree(buf);
 | |
|         return(NULL);
 | |
|     }
 | |
|     if (cur != stop) {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_LITERAL_NOT_FINISHED, NULL);
 | |
|     } else {
 | |
| 	NEXTL(1);
 | |
|     }
 | |
|     ctxt->instate = oldstate;
 | |
|     return(buf);
 | |
| }
 | |
| 
 | |
| static void xmlParseCharDataComplex(xmlParserCtxtPtr ctxt, int partial);
 | |
| 
 | |
| /*
 | |
|  * used for the test in the inner loop of the char data testing
 | |
|  */
 | |
| static const unsigned char test_char_data[256] = {
 | |
|     0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
 | |
|     0x00, 0x09, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* 0x9, CR/LF separated */
 | |
|     0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
 | |
|     0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
 | |
|     0x20, 0x21, 0x22, 0x23, 0x24, 0x25, 0x00, 0x27, /* & */
 | |
|     0x28, 0x29, 0x2A, 0x2B, 0x2C, 0x2D, 0x2E, 0x2F,
 | |
|     0x30, 0x31, 0x32, 0x33, 0x34, 0x35, 0x36, 0x37,
 | |
|     0x38, 0x39, 0x3A, 0x3B, 0x00, 0x3D, 0x3E, 0x3F, /* < */
 | |
|     0x40, 0x41, 0x42, 0x43, 0x44, 0x45, 0x46, 0x47,
 | |
|     0x48, 0x49, 0x4A, 0x4B, 0x4C, 0x4D, 0x4E, 0x4F,
 | |
|     0x50, 0x51, 0x52, 0x53, 0x54, 0x55, 0x56, 0x57,
 | |
|     0x58, 0x59, 0x5A, 0x5B, 0x5C, 0x00, 0x5E, 0x5F, /* ] */
 | |
|     0x60, 0x61, 0x62, 0x63, 0x64, 0x65, 0x66, 0x67,
 | |
|     0x68, 0x69, 0x6A, 0x6B, 0x6C, 0x6D, 0x6E, 0x6F,
 | |
|     0x70, 0x71, 0x72, 0x73, 0x74, 0x75, 0x76, 0x77,
 | |
|     0x78, 0x79, 0x7A, 0x7B, 0x7C, 0x7D, 0x7E, 0x7F,
 | |
|     0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, /* non-ascii */
 | |
|     0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
 | |
|     0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
 | |
|     0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
 | |
|     0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
 | |
|     0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
 | |
|     0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
 | |
|     0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
 | |
|     0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
 | |
|     0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
 | |
|     0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
 | |
|     0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
 | |
|     0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
 | |
|     0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
 | |
|     0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00,
 | |
|     0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00, 0x00
 | |
| };
 | |
| 
 | |
| /**
 | |
|  * xmlParseCharDataInternal:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @partial:  buffer may contain partial UTF-8 sequences
 | |
|  *
 | |
|  * Parse character data. Always makes progress if the first char isn't
 | |
|  * '<' or '&'.
 | |
|  *
 | |
|  * The right angle bracket (>) may be represented using the string ">",
 | |
|  * and must, for compatibility, be escaped using ">" or a character
 | |
|  * reference when it appears in the string "]]>" in content, when that
 | |
|  * string is not marking the end of a CDATA section.
 | |
|  *
 | |
|  * [14] CharData ::= [^<&]* - ([^<&]* ']]>' [^<&]*)
 | |
|  */
 | |
| static void
 | |
| xmlParseCharDataInternal(xmlParserCtxtPtr ctxt, int partial) {
 | |
|     const xmlChar *in;
 | |
|     int nbchar = 0;
 | |
|     int line = ctxt->input->line;
 | |
|     int col = ctxt->input->col;
 | |
|     int ccol;
 | |
| 
 | |
|     GROW;
 | |
|     /*
 | |
|      * Accelerated common case where input don't need to be
 | |
|      * modified before passing it to the handler.
 | |
|      */
 | |
|     in = ctxt->input->cur;
 | |
|     do {
 | |
| get_more_space:
 | |
|         while (*in == 0x20) { in++; ctxt->input->col++; }
 | |
|         if (*in == 0xA) {
 | |
|             do {
 | |
|                 ctxt->input->line++; ctxt->input->col = 1;
 | |
|                 in++;
 | |
|             } while (*in == 0xA);
 | |
|             goto get_more_space;
 | |
|         }
 | |
|         if (*in == '<') {
 | |
|             nbchar = in - ctxt->input->cur;
 | |
|             if (nbchar > 0) {
 | |
|                 const xmlChar *tmp = ctxt->input->cur;
 | |
|                 ctxt->input->cur = in;
 | |
| 
 | |
|                 if ((ctxt->sax != NULL) &&
 | |
|                     (ctxt->disableSAX == 0) &&
 | |
|                     (ctxt->sax->ignorableWhitespace !=
 | |
|                      ctxt->sax->characters)) {
 | |
|                     if (areBlanks(ctxt, tmp, nbchar, 1)) {
 | |
|                         if (ctxt->sax->ignorableWhitespace != NULL)
 | |
|                             ctxt->sax->ignorableWhitespace(ctxt->userData,
 | |
|                                                    tmp, nbchar);
 | |
|                     } else {
 | |
|                         if (ctxt->sax->characters != NULL)
 | |
|                             ctxt->sax->characters(ctxt->userData,
 | |
|                                                   tmp, nbchar);
 | |
|                         if (*ctxt->space == -1)
 | |
|                             *ctxt->space = -2;
 | |
|                     }
 | |
|                 } else if ((ctxt->sax != NULL) &&
 | |
|                            (ctxt->disableSAX == 0) &&
 | |
|                            (ctxt->sax->characters != NULL)) {
 | |
|                     ctxt->sax->characters(ctxt->userData,
 | |
|                                           tmp, nbchar);
 | |
|                 }
 | |
|             }
 | |
|             return;
 | |
|         }
 | |
| 
 | |
| get_more:
 | |
|         ccol = ctxt->input->col;
 | |
|         while (test_char_data[*in]) {
 | |
|             in++;
 | |
|             ccol++;
 | |
|         }
 | |
|         ctxt->input->col = ccol;
 | |
|         if (*in == 0xA) {
 | |
|             do {
 | |
|                 ctxt->input->line++; ctxt->input->col = 1;
 | |
|                 in++;
 | |
|             } while (*in == 0xA);
 | |
|             goto get_more;
 | |
|         }
 | |
|         if (*in == ']') {
 | |
|             if ((in[1] == ']') && (in[2] == '>')) {
 | |
|                 xmlFatalErr(ctxt, XML_ERR_MISPLACED_CDATA_END, NULL);
 | |
|                 if (ctxt->instate != XML_PARSER_EOF)
 | |
|                     ctxt->input->cur = in + 1;
 | |
|                 return;
 | |
|             }
 | |
|             in++;
 | |
|             ctxt->input->col++;
 | |
|             goto get_more;
 | |
|         }
 | |
|         nbchar = in - ctxt->input->cur;
 | |
|         if (nbchar > 0) {
 | |
|             if ((ctxt->sax != NULL) &&
 | |
|                 (ctxt->disableSAX == 0) &&
 | |
|                 (ctxt->sax->ignorableWhitespace !=
 | |
|                  ctxt->sax->characters) &&
 | |
|                 (IS_BLANK_CH(*ctxt->input->cur))) {
 | |
|                 const xmlChar *tmp = ctxt->input->cur;
 | |
|                 ctxt->input->cur = in;
 | |
| 
 | |
|                 if (areBlanks(ctxt, tmp, nbchar, 0)) {
 | |
|                     if (ctxt->sax->ignorableWhitespace != NULL)
 | |
|                         ctxt->sax->ignorableWhitespace(ctxt->userData,
 | |
|                                                        tmp, nbchar);
 | |
|                 } else {
 | |
|                     if (ctxt->sax->characters != NULL)
 | |
|                         ctxt->sax->characters(ctxt->userData,
 | |
|                                               tmp, nbchar);
 | |
|                     if (*ctxt->space == -1)
 | |
|                         *ctxt->space = -2;
 | |
|                 }
 | |
|                 line = ctxt->input->line;
 | |
|                 col = ctxt->input->col;
 | |
|             } else if ((ctxt->sax != NULL) &&
 | |
|                        (ctxt->disableSAX == 0)) {
 | |
|                 if (ctxt->sax->characters != NULL)
 | |
|                     ctxt->sax->characters(ctxt->userData,
 | |
|                                           ctxt->input->cur, nbchar);
 | |
|                 line = ctxt->input->line;
 | |
|                 col = ctxt->input->col;
 | |
|             }
 | |
|             if (ctxt->instate == XML_PARSER_EOF)
 | |
|                 return;
 | |
|         }
 | |
|         ctxt->input->cur = in;
 | |
|         if (*in == 0xD) {
 | |
|             in++;
 | |
|             if (*in == 0xA) {
 | |
|                 ctxt->input->cur = in;
 | |
|                 in++;
 | |
|                 ctxt->input->line++; ctxt->input->col = 1;
 | |
|                 continue; /* while */
 | |
|             }
 | |
|             in--;
 | |
|         }
 | |
|         if (*in == '<') {
 | |
|             return;
 | |
|         }
 | |
|         if (*in == '&') {
 | |
|             return;
 | |
|         }
 | |
|         SHRINK;
 | |
|         GROW;
 | |
|         if (ctxt->instate == XML_PARSER_EOF)
 | |
|             return;
 | |
|         in = ctxt->input->cur;
 | |
|     } while (((*in >= 0x20) && (*in <= 0x7F)) ||
 | |
|              (*in == 0x09) || (*in == 0x0a));
 | |
|     ctxt->input->line = line;
 | |
|     ctxt->input->col = col;
 | |
|     xmlParseCharDataComplex(ctxt, partial);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseCharDataComplex:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @cdata:  int indicating whether we are within a CDATA section
 | |
|  *
 | |
|  * Always makes progress if the first char isn't '<' or '&'.
 | |
|  *
 | |
|  * parse a CharData section.this is the fallback function
 | |
|  * of xmlParseCharData() when the parsing requires handling
 | |
|  * of non-ASCII characters.
 | |
|  */
 | |
| static void
 | |
| xmlParseCharDataComplex(xmlParserCtxtPtr ctxt, int partial) {
 | |
|     xmlChar buf[XML_PARSER_BIG_BUFFER_SIZE + 5];
 | |
|     int nbchar = 0;
 | |
|     int cur, l;
 | |
| 
 | |
|     cur = CUR_CHAR(l);
 | |
|     while ((cur != '<') && /* checked */
 | |
|            (cur != '&') &&
 | |
| 	   (IS_CHAR(cur))) {
 | |
| 	if ((cur == ']') && (NXT(1) == ']') && (NXT(2) == '>')) {
 | |
| 	    xmlFatalErr(ctxt, XML_ERR_MISPLACED_CDATA_END, NULL);
 | |
| 	}
 | |
| 	COPY_BUF(buf, nbchar, cur);
 | |
| 	/* move current position before possible calling of ctxt->sax->characters */
 | |
| 	NEXTL(l);
 | |
| 	if (nbchar >= XML_PARSER_BIG_BUFFER_SIZE) {
 | |
| 	    buf[nbchar] = 0;
 | |
| 
 | |
| 	    /*
 | |
| 	     * OK the segment is to be consumed as chars.
 | |
| 	     */
 | |
| 	    if ((ctxt->sax != NULL) && (!ctxt->disableSAX)) {
 | |
| 		if (areBlanks(ctxt, buf, nbchar, 0)) {
 | |
| 		    if (ctxt->sax->ignorableWhitespace != NULL)
 | |
| 			ctxt->sax->ignorableWhitespace(ctxt->userData,
 | |
| 			                               buf, nbchar);
 | |
| 		} else {
 | |
| 		    if (ctxt->sax->characters != NULL)
 | |
| 			ctxt->sax->characters(ctxt->userData, buf, nbchar);
 | |
| 		    if ((ctxt->sax->characters !=
 | |
| 		         ctxt->sax->ignorableWhitespace) &&
 | |
| 			(*ctxt->space == -1))
 | |
| 			*ctxt->space = -2;
 | |
| 		}
 | |
| 	    }
 | |
| 	    nbchar = 0;
 | |
|             /* something really bad happened in the SAX callback */
 | |
|             if (ctxt->instate != XML_PARSER_CONTENT)
 | |
|                 return;
 | |
|             SHRINK;
 | |
| 	}
 | |
| 	cur = CUR_CHAR(l);
 | |
|     }
 | |
|     if (ctxt->instate == XML_PARSER_EOF)
 | |
|         return;
 | |
|     if (nbchar != 0) {
 | |
|         buf[nbchar] = 0;
 | |
| 	/*
 | |
| 	 * OK the segment is to be consumed as chars.
 | |
| 	 */
 | |
| 	if ((ctxt->sax != NULL) && (!ctxt->disableSAX)) {
 | |
| 	    if (areBlanks(ctxt, buf, nbchar, 0)) {
 | |
| 		if (ctxt->sax->ignorableWhitespace != NULL)
 | |
| 		    ctxt->sax->ignorableWhitespace(ctxt->userData, buf, nbchar);
 | |
| 	    } else {
 | |
| 		if (ctxt->sax->characters != NULL)
 | |
| 		    ctxt->sax->characters(ctxt->userData, buf, nbchar);
 | |
| 		if ((ctxt->sax->characters != ctxt->sax->ignorableWhitespace) &&
 | |
| 		    (*ctxt->space == -1))
 | |
| 		    *ctxt->space = -2;
 | |
| 	    }
 | |
| 	}
 | |
|     }
 | |
|     /*
 | |
|      * cur == 0 can mean
 | |
|      *
 | |
|      * - XML_PARSER_EOF or memory error. This is checked above.
 | |
|      * - An actual 0 character.
 | |
|      * - End of buffer.
 | |
|      * - An incomplete UTF-8 sequence. This is allowed if partial is set.
 | |
|      */
 | |
|     if (ctxt->input->cur < ctxt->input->end) {
 | |
|         if ((cur == 0) && (CUR != 0)) {
 | |
|             if (partial == 0) {
 | |
|                 xmlFatalErrMsgInt(ctxt, XML_ERR_INVALID_CHAR,
 | |
|                         "Incomplete UTF-8 sequence starting with %02X\n", CUR);
 | |
|                 NEXTL(1);
 | |
|             }
 | |
|         } else if ((cur != '<') && (cur != '&')) {
 | |
|             /* Generate the error and skip the offending character */
 | |
|             xmlFatalErrMsgInt(ctxt, XML_ERR_INVALID_CHAR,
 | |
|                               "PCDATA invalid Char value %d\n", cur);
 | |
|             NEXTL(l);
 | |
|         }
 | |
|     }
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseCharData:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @cdata:  unused
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  */
 | |
| void
 | |
| xmlParseCharData(xmlParserCtxtPtr ctxt, ATTRIBUTE_UNUSED int cdata) {
 | |
|     xmlParseCharDataInternal(ctxt, 0);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseExternalID:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @publicID:  a xmlChar** receiving PubidLiteral
 | |
|  * @strict: indicate whether we should restrict parsing to only
 | |
|  *          production [75], see NOTE below
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * Parse an External ID or a Public ID
 | |
|  *
 | |
|  * NOTE: Productions [75] and [83] interact badly since [75] can generate
 | |
|  *       'PUBLIC' S PubidLiteral S SystemLiteral
 | |
|  *
 | |
|  * [75] ExternalID ::= 'SYSTEM' S SystemLiteral
 | |
|  *                   | 'PUBLIC' S PubidLiteral S SystemLiteral
 | |
|  *
 | |
|  * [83] PublicID ::= 'PUBLIC' S PubidLiteral
 | |
|  *
 | |
|  * Returns the function returns SystemLiteral and in the second
 | |
|  *                case publicID receives PubidLiteral, is strict is off
 | |
|  *                it is possible to return NULL and have publicID set.
 | |
|  */
 | |
| 
 | |
| xmlChar *
 | |
| xmlParseExternalID(xmlParserCtxtPtr ctxt, xmlChar **publicID, int strict) {
 | |
|     xmlChar *URI = NULL;
 | |
| 
 | |
|     *publicID = NULL;
 | |
|     if (CMP6(CUR_PTR, 'S', 'Y', 'S', 'T', 'E', 'M')) {
 | |
|         SKIP(6);
 | |
| 	if (SKIP_BLANKS == 0) {
 | |
| 	    xmlFatalErrMsg(ctxt, XML_ERR_SPACE_REQUIRED,
 | |
| 	                   "Space required after 'SYSTEM'\n");
 | |
| 	}
 | |
| 	URI = xmlParseSystemLiteral(ctxt);
 | |
| 	if (URI == NULL) {
 | |
| 	    xmlFatalErr(ctxt, XML_ERR_URI_REQUIRED, NULL);
 | |
|         }
 | |
|     } else if (CMP6(CUR_PTR, 'P', 'U', 'B', 'L', 'I', 'C')) {
 | |
|         SKIP(6);
 | |
| 	if (SKIP_BLANKS == 0) {
 | |
| 	    xmlFatalErrMsg(ctxt, XML_ERR_SPACE_REQUIRED,
 | |
| 		    "Space required after 'PUBLIC'\n");
 | |
| 	}
 | |
| 	*publicID = xmlParsePubidLiteral(ctxt);
 | |
| 	if (*publicID == NULL) {
 | |
| 	    xmlFatalErr(ctxt, XML_ERR_PUBID_REQUIRED, NULL);
 | |
| 	}
 | |
| 	if (strict) {
 | |
| 	    /*
 | |
| 	     * We don't handle [83] so "S SystemLiteral" is required.
 | |
| 	     */
 | |
| 	    if (SKIP_BLANKS == 0) {
 | |
| 		xmlFatalErrMsg(ctxt, XML_ERR_SPACE_REQUIRED,
 | |
| 			"Space required after the Public Identifier\n");
 | |
| 	    }
 | |
| 	} else {
 | |
| 	    /*
 | |
| 	     * We handle [83] so we return immediately, if
 | |
| 	     * "S SystemLiteral" is not detected. We skip blanks if no
 | |
|              * system literal was found, but this is harmless since we must
 | |
|              * be at the end of a NotationDecl.
 | |
| 	     */
 | |
| 	    if (SKIP_BLANKS == 0) return(NULL);
 | |
| 	    if ((CUR != '\'') && (CUR != '"')) return(NULL);
 | |
| 	}
 | |
| 	URI = xmlParseSystemLiteral(ctxt);
 | |
| 	if (URI == NULL) {
 | |
| 	    xmlFatalErr(ctxt, XML_ERR_URI_REQUIRED, NULL);
 | |
|         }
 | |
|     }
 | |
|     return(URI);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseCommentComplex:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @buf:  the already parsed part of the buffer
 | |
|  * @len:  number of bytes in the buffer
 | |
|  * @size:  allocated size of the buffer
 | |
|  *
 | |
|  * Skip an XML (SGML) comment <!-- .... -->
 | |
|  *  The spec says that "For compatibility, the string "--" (double-hyphen)
 | |
|  *  must not occur within comments. "
 | |
|  * This is the slow routine in case the accelerator for ascii didn't work
 | |
|  *
 | |
|  * [15] Comment ::= '<!--' ((Char - '-') | ('-' (Char - '-')))* '-->'
 | |
|  */
 | |
| static void
 | |
| xmlParseCommentComplex(xmlParserCtxtPtr ctxt, xmlChar *buf,
 | |
|                        size_t len, size_t size) {
 | |
|     int q, ql;
 | |
|     int r, rl;
 | |
|     int cur, l;
 | |
|     size_t maxLength = (ctxt->options & XML_PARSE_HUGE) ?
 | |
|                        XML_MAX_HUGE_LENGTH :
 | |
|                        XML_MAX_TEXT_LENGTH;
 | |
|     int inputid;
 | |
| 
 | |
|     inputid = ctxt->input->id;
 | |
| 
 | |
|     if (buf == NULL) {
 | |
|         len = 0;
 | |
| 	size = XML_PARSER_BUFFER_SIZE;
 | |
| 	buf = (xmlChar *) xmlMallocAtomic(size);
 | |
| 	if (buf == NULL) {
 | |
| 	    xmlErrMemory(ctxt, NULL);
 | |
| 	    return;
 | |
| 	}
 | |
|     }
 | |
|     q = CUR_CHAR(ql);
 | |
|     if (q == 0)
 | |
|         goto not_terminated;
 | |
|     if (!IS_CHAR(q)) {
 | |
|         xmlFatalErrMsgInt(ctxt, XML_ERR_INVALID_CHAR,
 | |
|                           "xmlParseComment: invalid xmlChar value %d\n",
 | |
| 	                  q);
 | |
| 	xmlFree (buf);
 | |
| 	return;
 | |
|     }
 | |
|     NEXTL(ql);
 | |
|     r = CUR_CHAR(rl);
 | |
|     if (r == 0)
 | |
|         goto not_terminated;
 | |
|     if (!IS_CHAR(r)) {
 | |
|         xmlFatalErrMsgInt(ctxt, XML_ERR_INVALID_CHAR,
 | |
|                           "xmlParseComment: invalid xmlChar value %d\n",
 | |
| 	                  r);
 | |
| 	xmlFree (buf);
 | |
| 	return;
 | |
|     }
 | |
|     NEXTL(rl);
 | |
|     cur = CUR_CHAR(l);
 | |
|     if (cur == 0)
 | |
|         goto not_terminated;
 | |
|     while (IS_CHAR(cur) && /* checked */
 | |
|            ((cur != '>') ||
 | |
| 	    (r != '-') || (q != '-'))) {
 | |
| 	if ((r == '-') && (q == '-')) {
 | |
| 	    xmlFatalErr(ctxt, XML_ERR_HYPHEN_IN_COMMENT, NULL);
 | |
| 	}
 | |
| 	if (len + 5 >= size) {
 | |
| 	    xmlChar *new_buf;
 | |
|             size_t new_size;
 | |
| 
 | |
| 	    new_size = size * 2;
 | |
| 	    new_buf = (xmlChar *) xmlRealloc(buf, new_size);
 | |
| 	    if (new_buf == NULL) {
 | |
| 		xmlFree (buf);
 | |
| 		xmlErrMemory(ctxt, NULL);
 | |
| 		return;
 | |
| 	    }
 | |
| 	    buf = new_buf;
 | |
|             size = new_size;
 | |
| 	}
 | |
| 	COPY_BUF(buf, len, q);
 | |
|         if (len > maxLength) {
 | |
|             xmlFatalErrMsgStr(ctxt, XML_ERR_COMMENT_NOT_FINISHED,
 | |
|                          "Comment too big found", NULL);
 | |
|             xmlFree (buf);
 | |
|             return;
 | |
|         }
 | |
| 
 | |
| 	q = r;
 | |
| 	ql = rl;
 | |
| 	r = cur;
 | |
| 	rl = l;
 | |
| 
 | |
| 	NEXTL(l);
 | |
| 	cur = CUR_CHAR(l);
 | |
| 
 | |
|     }
 | |
|     buf[len] = 0;
 | |
|     if (ctxt->instate == XML_PARSER_EOF) {
 | |
|         xmlFree(buf);
 | |
|         return;
 | |
|     }
 | |
|     if (cur == 0) {
 | |
| 	xmlFatalErrMsgStr(ctxt, XML_ERR_COMMENT_NOT_FINISHED,
 | |
| 	                     "Comment not terminated \n<!--%.50s\n", buf);
 | |
|     } else if (!IS_CHAR(cur)) {
 | |
|         xmlFatalErrMsgInt(ctxt, XML_ERR_INVALID_CHAR,
 | |
|                           "xmlParseComment: invalid xmlChar value %d\n",
 | |
| 	                  cur);
 | |
|     } else {
 | |
| 	if (inputid != ctxt->input->id) {
 | |
| 	    xmlFatalErrMsg(ctxt, XML_ERR_ENTITY_BOUNDARY,
 | |
| 		           "Comment doesn't start and stop in the same"
 | |
|                            " entity\n");
 | |
| 	}
 | |
|         NEXT;
 | |
| 	if ((ctxt->sax != NULL) && (ctxt->sax->comment != NULL) &&
 | |
| 	    (!ctxt->disableSAX))
 | |
| 	    ctxt->sax->comment(ctxt->userData, buf);
 | |
|     }
 | |
|     xmlFree(buf);
 | |
|     return;
 | |
| not_terminated:
 | |
|     xmlFatalErrMsgStr(ctxt, XML_ERR_COMMENT_NOT_FINISHED,
 | |
| 			 "Comment not terminated\n", NULL);
 | |
|     xmlFree(buf);
 | |
|     return;
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseComment:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * Parse an XML (SGML) comment. Always consumes '<!'.
 | |
|  *
 | |
|  *  The spec says that "For compatibility, the string "--" (double-hyphen)
 | |
|  *  must not occur within comments. "
 | |
|  *
 | |
|  * [15] Comment ::= '<!--' ((Char - '-') | ('-' (Char - '-')))* '-->'
 | |
|  */
 | |
| void
 | |
| xmlParseComment(xmlParserCtxtPtr ctxt) {
 | |
|     xmlChar *buf = NULL;
 | |
|     size_t size = XML_PARSER_BUFFER_SIZE;
 | |
|     size_t len = 0;
 | |
|     size_t maxLength = (ctxt->options & XML_PARSE_HUGE) ?
 | |
|                        XML_MAX_HUGE_LENGTH :
 | |
|                        XML_MAX_TEXT_LENGTH;
 | |
|     xmlParserInputState state;
 | |
|     const xmlChar *in;
 | |
|     size_t nbchar = 0;
 | |
|     int ccol;
 | |
|     int inputid;
 | |
| 
 | |
|     /*
 | |
|      * Check that there is a comment right here.
 | |
|      */
 | |
|     if ((RAW != '<') || (NXT(1) != '!'))
 | |
|         return;
 | |
|     SKIP(2);
 | |
|     if ((RAW != '-') || (NXT(1) != '-'))
 | |
|         return;
 | |
|     state = ctxt->instate;
 | |
|     ctxt->instate = XML_PARSER_COMMENT;
 | |
|     inputid = ctxt->input->id;
 | |
|     SKIP(2);
 | |
|     GROW;
 | |
| 
 | |
|     /*
 | |
|      * Accelerated common case where input don't need to be
 | |
|      * modified before passing it to the handler.
 | |
|      */
 | |
|     in = ctxt->input->cur;
 | |
|     do {
 | |
| 	if (*in == 0xA) {
 | |
| 	    do {
 | |
| 		ctxt->input->line++; ctxt->input->col = 1;
 | |
| 		in++;
 | |
| 	    } while (*in == 0xA);
 | |
| 	}
 | |
| get_more:
 | |
|         ccol = ctxt->input->col;
 | |
| 	while (((*in > '-') && (*in <= 0x7F)) ||
 | |
| 	       ((*in >= 0x20) && (*in < '-')) ||
 | |
| 	       (*in == 0x09)) {
 | |
| 		    in++;
 | |
| 		    ccol++;
 | |
| 	}
 | |
| 	ctxt->input->col = ccol;
 | |
| 	if (*in == 0xA) {
 | |
| 	    do {
 | |
| 		ctxt->input->line++; ctxt->input->col = 1;
 | |
| 		in++;
 | |
| 	    } while (*in == 0xA);
 | |
| 	    goto get_more;
 | |
| 	}
 | |
| 	nbchar = in - ctxt->input->cur;
 | |
| 	/*
 | |
| 	 * save current set of data
 | |
| 	 */
 | |
| 	if (nbchar > 0) {
 | |
|             if (buf == NULL) {
 | |
|                 if ((*in == '-') && (in[1] == '-'))
 | |
|                     size = nbchar + 1;
 | |
|                 else
 | |
|                     size = XML_PARSER_BUFFER_SIZE + nbchar;
 | |
|                 buf = (xmlChar *) xmlMallocAtomic(size);
 | |
|                 if (buf == NULL) {
 | |
|                     xmlErrMemory(ctxt, NULL);
 | |
|                     ctxt->instate = state;
 | |
|                     return;
 | |
|                 }
 | |
|                 len = 0;
 | |
|             } else if (len + nbchar + 1 >= size) {
 | |
|                 xmlChar *new_buf;
 | |
|                 size  += len + nbchar + XML_PARSER_BUFFER_SIZE;
 | |
|                 new_buf = (xmlChar *) xmlRealloc(buf, size);
 | |
|                 if (new_buf == NULL) {
 | |
|                     xmlFree (buf);
 | |
|                     xmlErrMemory(ctxt, NULL);
 | |
|                     ctxt->instate = state;
 | |
|                     return;
 | |
|                 }
 | |
|                 buf = new_buf;
 | |
|             }
 | |
|             memcpy(&buf[len], ctxt->input->cur, nbchar);
 | |
|             len += nbchar;
 | |
|             buf[len] = 0;
 | |
| 	}
 | |
|         if (len > maxLength) {
 | |
|             xmlFatalErrMsgStr(ctxt, XML_ERR_COMMENT_NOT_FINISHED,
 | |
|                          "Comment too big found", NULL);
 | |
|             xmlFree (buf);
 | |
|             return;
 | |
|         }
 | |
| 	ctxt->input->cur = in;
 | |
| 	if (*in == 0xA) {
 | |
| 	    in++;
 | |
| 	    ctxt->input->line++; ctxt->input->col = 1;
 | |
| 	}
 | |
| 	if (*in == 0xD) {
 | |
| 	    in++;
 | |
| 	    if (*in == 0xA) {
 | |
| 		ctxt->input->cur = in;
 | |
| 		in++;
 | |
| 		ctxt->input->line++; ctxt->input->col = 1;
 | |
| 		goto get_more;
 | |
| 	    }
 | |
| 	    in--;
 | |
| 	}
 | |
| 	SHRINK;
 | |
| 	GROW;
 | |
|         if (ctxt->instate == XML_PARSER_EOF) {
 | |
|             xmlFree(buf);
 | |
|             return;
 | |
|         }
 | |
| 	in = ctxt->input->cur;
 | |
| 	if (*in == '-') {
 | |
| 	    if (in[1] == '-') {
 | |
| 	        if (in[2] == '>') {
 | |
| 		    if (ctxt->input->id != inputid) {
 | |
| 			xmlFatalErrMsg(ctxt, XML_ERR_ENTITY_BOUNDARY,
 | |
| 			               "comment doesn't start and stop in the"
 | |
|                                        " same entity\n");
 | |
| 		    }
 | |
| 		    SKIP(3);
 | |
| 		    if ((ctxt->sax != NULL) && (ctxt->sax->comment != NULL) &&
 | |
| 		        (!ctxt->disableSAX)) {
 | |
| 			if (buf != NULL)
 | |
| 			    ctxt->sax->comment(ctxt->userData, buf);
 | |
| 			else
 | |
| 			    ctxt->sax->comment(ctxt->userData, BAD_CAST "");
 | |
| 		    }
 | |
| 		    if (buf != NULL)
 | |
| 		        xmlFree(buf);
 | |
| 		    if (ctxt->instate != XML_PARSER_EOF)
 | |
| 			ctxt->instate = state;
 | |
| 		    return;
 | |
| 		}
 | |
| 		if (buf != NULL) {
 | |
| 		    xmlFatalErrMsgStr(ctxt, XML_ERR_HYPHEN_IN_COMMENT,
 | |
| 		                      "Double hyphen within comment: "
 | |
|                                       "<!--%.50s\n",
 | |
| 				      buf);
 | |
| 		} else
 | |
| 		    xmlFatalErrMsgStr(ctxt, XML_ERR_HYPHEN_IN_COMMENT,
 | |
| 		                      "Double hyphen within comment\n", NULL);
 | |
|                 if (ctxt->instate == XML_PARSER_EOF) {
 | |
|                     xmlFree(buf);
 | |
|                     return;
 | |
|                 }
 | |
| 		in++;
 | |
| 		ctxt->input->col++;
 | |
| 	    }
 | |
| 	    in++;
 | |
| 	    ctxt->input->col++;
 | |
| 	    goto get_more;
 | |
| 	}
 | |
|     } while (((*in >= 0x20) && (*in <= 0x7F)) || (*in == 0x09) || (*in == 0x0a));
 | |
|     xmlParseCommentComplex(ctxt, buf, len, size);
 | |
|     ctxt->instate = state;
 | |
|     return;
 | |
| }
 | |
| 
 | |
| 
 | |
| /**
 | |
|  * xmlParsePITarget:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * parse the name of a PI
 | |
|  *
 | |
|  * [17] PITarget ::= Name - (('X' | 'x') ('M' | 'm') ('L' | 'l'))
 | |
|  *
 | |
|  * Returns the PITarget name or NULL
 | |
|  */
 | |
| 
 | |
| const xmlChar *
 | |
| xmlParsePITarget(xmlParserCtxtPtr ctxt) {
 | |
|     const xmlChar *name;
 | |
| 
 | |
|     name = xmlParseName(ctxt);
 | |
|     if ((name != NULL) &&
 | |
|         ((name[0] == 'x') || (name[0] == 'X')) &&
 | |
|         ((name[1] == 'm') || (name[1] == 'M')) &&
 | |
|         ((name[2] == 'l') || (name[2] == 'L'))) {
 | |
| 	int i;
 | |
| 	if ((name[0] == 'x') && (name[1] == 'm') &&
 | |
| 	    (name[2] == 'l') && (name[3] == 0)) {
 | |
| 	    xmlFatalErrMsg(ctxt, XML_ERR_RESERVED_XML_NAME,
 | |
| 		 "XML declaration allowed only at the start of the document\n");
 | |
| 	    return(name);
 | |
| 	} else if (name[3] == 0) {
 | |
| 	    xmlFatalErr(ctxt, XML_ERR_RESERVED_XML_NAME, NULL);
 | |
| 	    return(name);
 | |
| 	}
 | |
| 	for (i = 0;;i++) {
 | |
| 	    if (xmlW3CPIs[i] == NULL) break;
 | |
| 	    if (xmlStrEqual(name, (const xmlChar *)xmlW3CPIs[i]))
 | |
| 	        return(name);
 | |
| 	}
 | |
| 	xmlWarningMsg(ctxt, XML_ERR_RESERVED_XML_NAME,
 | |
| 		      "xmlParsePITarget: invalid name prefix 'xml'\n",
 | |
| 		      NULL, NULL);
 | |
|     }
 | |
|     if ((name != NULL) && (xmlStrchr(name, ':') != NULL)) {
 | |
| 	xmlNsErr(ctxt, XML_NS_ERR_COLON,
 | |
| 		 "colons are forbidden from PI names '%s'\n", name, NULL, NULL);
 | |
|     }
 | |
|     return(name);
 | |
| }
 | |
| 
 | |
| #ifdef LIBXML_CATALOG_ENABLED
 | |
| /**
 | |
|  * xmlParseCatalogPI:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @catalog:  the PI value string
 | |
|  *
 | |
|  * parse an XML Catalog Processing Instruction.
 | |
|  *
 | |
|  * <?oasis-xml-catalog catalog="http://example.com/catalog.xml"?>
 | |
|  *
 | |
|  * Occurs only if allowed by the user and if happening in the Misc
 | |
|  * part of the document before any doctype information
 | |
|  * This will add the given catalog to the parsing context in order
 | |
|  * to be used if there is a resolution need further down in the document
 | |
|  */
 | |
| 
 | |
| static void
 | |
| xmlParseCatalogPI(xmlParserCtxtPtr ctxt, const xmlChar *catalog) {
 | |
|     xmlChar *URL = NULL;
 | |
|     const xmlChar *tmp, *base;
 | |
|     xmlChar marker;
 | |
| 
 | |
|     tmp = catalog;
 | |
|     while (IS_BLANK_CH(*tmp)) tmp++;
 | |
|     if (xmlStrncmp(tmp, BAD_CAST"catalog", 7))
 | |
| 	goto error;
 | |
|     tmp += 7;
 | |
|     while (IS_BLANK_CH(*tmp)) tmp++;
 | |
|     if (*tmp != '=') {
 | |
| 	return;
 | |
|     }
 | |
|     tmp++;
 | |
|     while (IS_BLANK_CH(*tmp)) tmp++;
 | |
|     marker = *tmp;
 | |
|     if ((marker != '\'') && (marker != '"'))
 | |
| 	goto error;
 | |
|     tmp++;
 | |
|     base = tmp;
 | |
|     while ((*tmp != 0) && (*tmp != marker)) tmp++;
 | |
|     if (*tmp == 0)
 | |
| 	goto error;
 | |
|     URL = xmlStrndup(base, tmp - base);
 | |
|     tmp++;
 | |
|     while (IS_BLANK_CH(*tmp)) tmp++;
 | |
|     if (*tmp != 0)
 | |
| 	goto error;
 | |
| 
 | |
|     if (URL != NULL) {
 | |
| 	ctxt->catalogs = xmlCatalogAddLocal(ctxt->catalogs, URL);
 | |
| 	xmlFree(URL);
 | |
|     }
 | |
|     return;
 | |
| 
 | |
| error:
 | |
|     xmlWarningMsg(ctxt, XML_WAR_CATALOG_PI,
 | |
| 	          "Catalog PI syntax error: %s\n",
 | |
| 		  catalog, NULL);
 | |
|     if (URL != NULL)
 | |
| 	xmlFree(URL);
 | |
| }
 | |
| #endif
 | |
| 
 | |
| /**
 | |
|  * xmlParsePI:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * parse an XML Processing Instruction.
 | |
|  *
 | |
|  * [16] PI ::= '<?' PITarget (S (Char* - (Char* '?>' Char*)))? '?>'
 | |
|  *
 | |
|  * The processing is transferred to SAX once parsed.
 | |
|  */
 | |
| 
 | |
| void
 | |
| xmlParsePI(xmlParserCtxtPtr ctxt) {
 | |
|     xmlChar *buf = NULL;
 | |
|     size_t len = 0;
 | |
|     size_t size = XML_PARSER_BUFFER_SIZE;
 | |
|     size_t maxLength = (ctxt->options & XML_PARSE_HUGE) ?
 | |
|                        XML_MAX_HUGE_LENGTH :
 | |
|                        XML_MAX_TEXT_LENGTH;
 | |
|     int cur, l;
 | |
|     const xmlChar *target;
 | |
|     xmlParserInputState state;
 | |
| 
 | |
|     if ((RAW == '<') && (NXT(1) == '?')) {
 | |
| 	int inputid = ctxt->input->id;
 | |
| 	state = ctxt->instate;
 | |
|         ctxt->instate = XML_PARSER_PI;
 | |
| 	/*
 | |
| 	 * this is a Processing Instruction.
 | |
| 	 */
 | |
| 	SKIP(2);
 | |
| 
 | |
| 	/*
 | |
| 	 * Parse the target name and check for special support like
 | |
| 	 * namespace.
 | |
| 	 */
 | |
|         target = xmlParsePITarget(ctxt);
 | |
| 	if (target != NULL) {
 | |
| 	    if ((RAW == '?') && (NXT(1) == '>')) {
 | |
| 		if (inputid != ctxt->input->id) {
 | |
| 		    xmlFatalErrMsg(ctxt, XML_ERR_ENTITY_BOUNDARY,
 | |
| 	                           "PI declaration doesn't start and stop in"
 | |
|                                    " the same entity\n");
 | |
| 		}
 | |
| 		SKIP(2);
 | |
| 
 | |
| 		/*
 | |
| 		 * SAX: PI detected.
 | |
| 		 */
 | |
| 		if ((ctxt->sax) && (!ctxt->disableSAX) &&
 | |
| 		    (ctxt->sax->processingInstruction != NULL))
 | |
| 		    ctxt->sax->processingInstruction(ctxt->userData,
 | |
| 		                                     target, NULL);
 | |
| 		if (ctxt->instate != XML_PARSER_EOF)
 | |
| 		    ctxt->instate = state;
 | |
| 		return;
 | |
| 	    }
 | |
| 	    buf = (xmlChar *) xmlMallocAtomic(size);
 | |
| 	    if (buf == NULL) {
 | |
| 		xmlErrMemory(ctxt, NULL);
 | |
| 		ctxt->instate = state;
 | |
| 		return;
 | |
| 	    }
 | |
| 	    if (SKIP_BLANKS == 0) {
 | |
| 		xmlFatalErrMsgStr(ctxt, XML_ERR_SPACE_REQUIRED,
 | |
| 			  "ParsePI: PI %s space expected\n", target);
 | |
| 	    }
 | |
| 	    cur = CUR_CHAR(l);
 | |
| 	    while (IS_CHAR(cur) && /* checked */
 | |
| 		   ((cur != '?') || (NXT(1) != '>'))) {
 | |
| 		if (len + 5 >= size) {
 | |
| 		    xmlChar *tmp;
 | |
|                     size_t new_size = size * 2;
 | |
| 		    tmp = (xmlChar *) xmlRealloc(buf, new_size);
 | |
| 		    if (tmp == NULL) {
 | |
| 			xmlErrMemory(ctxt, NULL);
 | |
| 			xmlFree(buf);
 | |
| 			ctxt->instate = state;
 | |
| 			return;
 | |
| 		    }
 | |
| 		    buf = tmp;
 | |
|                     size = new_size;
 | |
| 		}
 | |
| 		COPY_BUF(buf, len, cur);
 | |
|                 if (len > maxLength) {
 | |
|                     xmlFatalErrMsgStr(ctxt, XML_ERR_PI_NOT_FINISHED,
 | |
|                                       "PI %s too big found", target);
 | |
|                     xmlFree(buf);
 | |
|                     ctxt->instate = state;
 | |
|                     return;
 | |
|                 }
 | |
| 		NEXTL(l);
 | |
| 		cur = CUR_CHAR(l);
 | |
| 	    }
 | |
| 	    buf[len] = 0;
 | |
|             if (ctxt->instate == XML_PARSER_EOF) {
 | |
|                 xmlFree(buf);
 | |
|                 return;
 | |
|             }
 | |
| 	    if (cur != '?') {
 | |
| 		xmlFatalErrMsgStr(ctxt, XML_ERR_PI_NOT_FINISHED,
 | |
| 		      "ParsePI: PI %s never end ...\n", target);
 | |
| 	    } else {
 | |
| 		if (inputid != ctxt->input->id) {
 | |
| 		    xmlFatalErrMsg(ctxt, XML_ERR_ENTITY_BOUNDARY,
 | |
| 	                           "PI declaration doesn't start and stop in"
 | |
|                                    " the same entity\n");
 | |
| 		}
 | |
| 		SKIP(2);
 | |
| 
 | |
| #ifdef LIBXML_CATALOG_ENABLED
 | |
| 		if (((state == XML_PARSER_MISC) ||
 | |
| 	             (state == XML_PARSER_START)) &&
 | |
| 		    (xmlStrEqual(target, XML_CATALOG_PI))) {
 | |
| 		    xmlCatalogAllow allow = xmlCatalogGetDefaults();
 | |
| 		    if ((allow == XML_CATA_ALLOW_DOCUMENT) ||
 | |
| 			(allow == XML_CATA_ALLOW_ALL))
 | |
| 			xmlParseCatalogPI(ctxt, buf);
 | |
| 		}
 | |
| #endif
 | |
| 
 | |
| 
 | |
| 		/*
 | |
| 		 * SAX: PI detected.
 | |
| 		 */
 | |
| 		if ((ctxt->sax) && (!ctxt->disableSAX) &&
 | |
| 		    (ctxt->sax->processingInstruction != NULL))
 | |
| 		    ctxt->sax->processingInstruction(ctxt->userData,
 | |
| 		                                     target, buf);
 | |
| 	    }
 | |
| 	    xmlFree(buf);
 | |
| 	} else {
 | |
| 	    xmlFatalErr(ctxt, XML_ERR_PI_NOT_STARTED, NULL);
 | |
| 	}
 | |
| 	if (ctxt->instate != XML_PARSER_EOF)
 | |
| 	    ctxt->instate = state;
 | |
|     }
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseNotationDecl:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * Parse a notation declaration. Always consumes '<!'.
 | |
|  *
 | |
|  * [82] NotationDecl ::= '<!NOTATION' S Name S (ExternalID |  PublicID) S? '>'
 | |
|  *
 | |
|  * Hence there is actually 3 choices:
 | |
|  *     'PUBLIC' S PubidLiteral
 | |
|  *     'PUBLIC' S PubidLiteral S SystemLiteral
 | |
|  * and 'SYSTEM' S SystemLiteral
 | |
|  *
 | |
|  * See the NOTE on xmlParseExternalID().
 | |
|  */
 | |
| 
 | |
| void
 | |
| xmlParseNotationDecl(xmlParserCtxtPtr ctxt) {
 | |
|     const xmlChar *name;
 | |
|     xmlChar *Pubid;
 | |
|     xmlChar *Systemid;
 | |
| 
 | |
|     if ((CUR != '<') || (NXT(1) != '!'))
 | |
|         return;
 | |
|     SKIP(2);
 | |
| 
 | |
|     if (CMP8(CUR_PTR, 'N', 'O', 'T', 'A', 'T', 'I', 'O', 'N')) {
 | |
| 	int inputid = ctxt->input->id;
 | |
| 	SKIP(8);
 | |
| 	if (SKIP_BLANKS == 0) {
 | |
| 	    xmlFatalErrMsg(ctxt, XML_ERR_SPACE_REQUIRED,
 | |
| 			   "Space required after '<!NOTATION'\n");
 | |
| 	    return;
 | |
| 	}
 | |
| 
 | |
|         name = xmlParseName(ctxt);
 | |
| 	if (name == NULL) {
 | |
| 	    xmlFatalErr(ctxt, XML_ERR_NOTATION_NOT_STARTED, NULL);
 | |
| 	    return;
 | |
| 	}
 | |
| 	if (xmlStrchr(name, ':') != NULL) {
 | |
| 	    xmlNsErr(ctxt, XML_NS_ERR_COLON,
 | |
| 		     "colons are forbidden from notation names '%s'\n",
 | |
| 		     name, NULL, NULL);
 | |
| 	}
 | |
| 	if (SKIP_BLANKS == 0) {
 | |
| 	    xmlFatalErrMsg(ctxt, XML_ERR_SPACE_REQUIRED,
 | |
| 		     "Space required after the NOTATION name'\n");
 | |
| 	    return;
 | |
| 	}
 | |
| 
 | |
| 	/*
 | |
| 	 * Parse the IDs.
 | |
| 	 */
 | |
| 	Systemid = xmlParseExternalID(ctxt, &Pubid, 0);
 | |
| 	SKIP_BLANKS;
 | |
| 
 | |
| 	if (RAW == '>') {
 | |
| 	    if (inputid != ctxt->input->id) {
 | |
| 		xmlFatalErrMsg(ctxt, XML_ERR_ENTITY_BOUNDARY,
 | |
| 	                       "Notation declaration doesn't start and stop"
 | |
|                                " in the same entity\n");
 | |
| 	    }
 | |
| 	    NEXT;
 | |
| 	    if ((ctxt->sax != NULL) && (!ctxt->disableSAX) &&
 | |
| 		(ctxt->sax->notationDecl != NULL))
 | |
| 		ctxt->sax->notationDecl(ctxt->userData, name, Pubid, Systemid);
 | |
| 	} else {
 | |
| 	    xmlFatalErr(ctxt, XML_ERR_NOTATION_NOT_FINISHED, NULL);
 | |
| 	}
 | |
| 	if (Systemid != NULL) xmlFree(Systemid);
 | |
| 	if (Pubid != NULL) xmlFree(Pubid);
 | |
|     }
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseEntityDecl:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * Parse an entity declaration. Always consumes '<!'.
 | |
|  *
 | |
|  * [70] EntityDecl ::= GEDecl | PEDecl
 | |
|  *
 | |
|  * [71] GEDecl ::= '<!ENTITY' S Name S EntityDef S? '>'
 | |
|  *
 | |
|  * [72] PEDecl ::= '<!ENTITY' S '%' S Name S PEDef S? '>'
 | |
|  *
 | |
|  * [73] EntityDef ::= EntityValue | (ExternalID NDataDecl?)
 | |
|  *
 | |
|  * [74] PEDef ::= EntityValue | ExternalID
 | |
|  *
 | |
|  * [76] NDataDecl ::= S 'NDATA' S Name
 | |
|  *
 | |
|  * [ VC: Notation Declared ]
 | |
|  * The Name must match the declared name of a notation.
 | |
|  */
 | |
| 
 | |
| void
 | |
| xmlParseEntityDecl(xmlParserCtxtPtr ctxt) {
 | |
|     const xmlChar *name = NULL;
 | |
|     xmlChar *value = NULL;
 | |
|     xmlChar *URI = NULL, *literal = NULL;
 | |
|     const xmlChar *ndata = NULL;
 | |
|     int isParameter = 0;
 | |
|     xmlChar *orig = NULL;
 | |
| 
 | |
|     if ((CUR != '<') || (NXT(1) != '!'))
 | |
|         return;
 | |
|     SKIP(2);
 | |
| 
 | |
|     /* GROW; done in the caller */
 | |
|     if (CMP6(CUR_PTR, 'E', 'N', 'T', 'I', 'T', 'Y')) {
 | |
| 	int inputid = ctxt->input->id;
 | |
| 	SKIP(6);
 | |
| 	if (SKIP_BLANKS == 0) {
 | |
| 	    xmlFatalErrMsg(ctxt, XML_ERR_SPACE_REQUIRED,
 | |
| 			   "Space required after '<!ENTITY'\n");
 | |
| 	}
 | |
| 
 | |
| 	if (RAW == '%') {
 | |
| 	    NEXT;
 | |
| 	    if (SKIP_BLANKS == 0) {
 | |
| 		xmlFatalErrMsg(ctxt, XML_ERR_SPACE_REQUIRED,
 | |
| 			       "Space required after '%%'\n");
 | |
| 	    }
 | |
| 	    isParameter = 1;
 | |
| 	}
 | |
| 
 | |
|         name = xmlParseName(ctxt);
 | |
| 	if (name == NULL) {
 | |
| 	    xmlFatalErrMsg(ctxt, XML_ERR_NAME_REQUIRED,
 | |
| 	                   "xmlParseEntityDecl: no name\n");
 | |
|             return;
 | |
| 	}
 | |
| 	if (xmlStrchr(name, ':') != NULL) {
 | |
| 	    xmlNsErr(ctxt, XML_NS_ERR_COLON,
 | |
| 		     "colons are forbidden from entities names '%s'\n",
 | |
| 		     name, NULL, NULL);
 | |
| 	}
 | |
| 	if (SKIP_BLANKS == 0) {
 | |
| 	    xmlFatalErrMsg(ctxt, XML_ERR_SPACE_REQUIRED,
 | |
| 			   "Space required after the entity name\n");
 | |
| 	}
 | |
| 
 | |
| 	ctxt->instate = XML_PARSER_ENTITY_DECL;
 | |
| 	/*
 | |
| 	 * handle the various case of definitions...
 | |
| 	 */
 | |
| 	if (isParameter) {
 | |
| 	    if ((RAW == '"') || (RAW == '\'')) {
 | |
| 	        value = xmlParseEntityValue(ctxt, &orig);
 | |
| 		if (value) {
 | |
| 		    if ((ctxt->sax != NULL) &&
 | |
| 			(!ctxt->disableSAX) && (ctxt->sax->entityDecl != NULL))
 | |
| 			ctxt->sax->entityDecl(ctxt->userData, name,
 | |
| 		                    XML_INTERNAL_PARAMETER_ENTITY,
 | |
| 				    NULL, NULL, value);
 | |
| 		}
 | |
| 	    } else {
 | |
| 	        URI = xmlParseExternalID(ctxt, &literal, 1);
 | |
| 		if ((URI == NULL) && (literal == NULL)) {
 | |
| 		    xmlFatalErr(ctxt, XML_ERR_VALUE_REQUIRED, NULL);
 | |
| 		}
 | |
| 		if (URI) {
 | |
| 		    xmlURIPtr uri;
 | |
| 
 | |
| 		    uri = xmlParseURI((const char *) URI);
 | |
| 		    if (uri == NULL) {
 | |
| 		        xmlErrMsgStr(ctxt, XML_ERR_INVALID_URI,
 | |
| 				     "Invalid URI: %s\n", URI);
 | |
| 			/*
 | |
| 			 * This really ought to be a well formedness error
 | |
| 			 * but the XML Core WG decided otherwise c.f. issue
 | |
| 			 * E26 of the XML erratas.
 | |
| 			 */
 | |
| 		    } else {
 | |
| 			if (uri->fragment != NULL) {
 | |
| 			    /*
 | |
| 			     * Okay this is foolish to block those but not
 | |
| 			     * invalid URIs.
 | |
| 			     */
 | |
| 			    xmlFatalErr(ctxt, XML_ERR_URI_FRAGMENT, NULL);
 | |
| 			} else {
 | |
| 			    if ((ctxt->sax != NULL) &&
 | |
| 				(!ctxt->disableSAX) &&
 | |
| 				(ctxt->sax->entityDecl != NULL))
 | |
| 				ctxt->sax->entityDecl(ctxt->userData, name,
 | |
| 					    XML_EXTERNAL_PARAMETER_ENTITY,
 | |
| 					    literal, URI, NULL);
 | |
| 			}
 | |
| 			xmlFreeURI(uri);
 | |
| 		    }
 | |
| 		}
 | |
| 	    }
 | |
| 	} else {
 | |
| 	    if ((RAW == '"') || (RAW == '\'')) {
 | |
| 	        value = xmlParseEntityValue(ctxt, &orig);
 | |
| 		if ((ctxt->sax != NULL) &&
 | |
| 		    (!ctxt->disableSAX) && (ctxt->sax->entityDecl != NULL))
 | |
| 		    ctxt->sax->entityDecl(ctxt->userData, name,
 | |
| 				XML_INTERNAL_GENERAL_ENTITY,
 | |
| 				NULL, NULL, value);
 | |
| 		/*
 | |
| 		 * For expat compatibility in SAX mode.
 | |
| 		 */
 | |
| 		if ((ctxt->myDoc == NULL) ||
 | |
| 		    (xmlStrEqual(ctxt->myDoc->version, SAX_COMPAT_MODE))) {
 | |
| 		    if (ctxt->myDoc == NULL) {
 | |
| 			ctxt->myDoc = xmlNewDoc(SAX_COMPAT_MODE);
 | |
| 			if (ctxt->myDoc == NULL) {
 | |
| 			    xmlErrMemory(ctxt, "New Doc failed");
 | |
| 			    goto done;
 | |
| 			}
 | |
| 			ctxt->myDoc->properties = XML_DOC_INTERNAL;
 | |
| 		    }
 | |
| 		    if (ctxt->myDoc->intSubset == NULL)
 | |
| 			ctxt->myDoc->intSubset = xmlNewDtd(ctxt->myDoc,
 | |
| 					    BAD_CAST "fake", NULL, NULL);
 | |
| 
 | |
| 		    xmlSAX2EntityDecl(ctxt, name, XML_INTERNAL_GENERAL_ENTITY,
 | |
| 			              NULL, NULL, value);
 | |
| 		}
 | |
| 	    } else {
 | |
| 	        URI = xmlParseExternalID(ctxt, &literal, 1);
 | |
| 		if ((URI == NULL) && (literal == NULL)) {
 | |
| 		    xmlFatalErr(ctxt, XML_ERR_VALUE_REQUIRED, NULL);
 | |
| 		}
 | |
| 		if (URI) {
 | |
| 		    xmlURIPtr uri;
 | |
| 
 | |
| 		    uri = xmlParseURI((const char *)URI);
 | |
| 		    if (uri == NULL) {
 | |
| 		        xmlErrMsgStr(ctxt, XML_ERR_INVALID_URI,
 | |
| 				     "Invalid URI: %s\n", URI);
 | |
| 			/*
 | |
| 			 * This really ought to be a well formedness error
 | |
| 			 * but the XML Core WG decided otherwise c.f. issue
 | |
| 			 * E26 of the XML erratas.
 | |
| 			 */
 | |
| 		    } else {
 | |
| 			if (uri->fragment != NULL) {
 | |
| 			    /*
 | |
| 			     * Okay this is foolish to block those but not
 | |
| 			     * invalid URIs.
 | |
| 			     */
 | |
| 			    xmlFatalErr(ctxt, XML_ERR_URI_FRAGMENT, NULL);
 | |
| 			}
 | |
| 			xmlFreeURI(uri);
 | |
| 		    }
 | |
| 		}
 | |
| 		if ((RAW != '>') && (SKIP_BLANKS == 0)) {
 | |
| 		    xmlFatalErrMsg(ctxt, XML_ERR_SPACE_REQUIRED,
 | |
| 				   "Space required before 'NDATA'\n");
 | |
| 		}
 | |
| 		if (CMP5(CUR_PTR, 'N', 'D', 'A', 'T', 'A')) {
 | |
| 		    SKIP(5);
 | |
| 		    if (SKIP_BLANKS == 0) {
 | |
| 			xmlFatalErrMsg(ctxt, XML_ERR_SPACE_REQUIRED,
 | |
| 				       "Space required after 'NDATA'\n");
 | |
| 		    }
 | |
| 		    ndata = xmlParseName(ctxt);
 | |
| 		    if ((ctxt->sax != NULL) && (!ctxt->disableSAX) &&
 | |
| 		        (ctxt->sax->unparsedEntityDecl != NULL))
 | |
| 			ctxt->sax->unparsedEntityDecl(ctxt->userData, name,
 | |
| 				    literal, URI, ndata);
 | |
| 		} else {
 | |
| 		    if ((ctxt->sax != NULL) &&
 | |
| 		        (!ctxt->disableSAX) && (ctxt->sax->entityDecl != NULL))
 | |
| 			ctxt->sax->entityDecl(ctxt->userData, name,
 | |
| 				    XML_EXTERNAL_GENERAL_PARSED_ENTITY,
 | |
| 				    literal, URI, NULL);
 | |
| 		    /*
 | |
| 		     * For expat compatibility in SAX mode.
 | |
| 		     * assuming the entity replacement was asked for
 | |
| 		     */
 | |
| 		    if ((ctxt->replaceEntities != 0) &&
 | |
| 			((ctxt->myDoc == NULL) ||
 | |
| 			(xmlStrEqual(ctxt->myDoc->version, SAX_COMPAT_MODE)))) {
 | |
| 			if (ctxt->myDoc == NULL) {
 | |
| 			    ctxt->myDoc = xmlNewDoc(SAX_COMPAT_MODE);
 | |
| 			    if (ctxt->myDoc == NULL) {
 | |
| 			        xmlErrMemory(ctxt, "New Doc failed");
 | |
| 				goto done;
 | |
| 			    }
 | |
| 			    ctxt->myDoc->properties = XML_DOC_INTERNAL;
 | |
| 			}
 | |
| 
 | |
| 			if (ctxt->myDoc->intSubset == NULL)
 | |
| 			    ctxt->myDoc->intSubset = xmlNewDtd(ctxt->myDoc,
 | |
| 						BAD_CAST "fake", NULL, NULL);
 | |
| 			xmlSAX2EntityDecl(ctxt, name,
 | |
| 				          XML_EXTERNAL_GENERAL_PARSED_ENTITY,
 | |
| 				          literal, URI, NULL);
 | |
| 		    }
 | |
| 		}
 | |
| 	    }
 | |
| 	}
 | |
| 	if (ctxt->instate == XML_PARSER_EOF)
 | |
| 	    goto done;
 | |
| 	SKIP_BLANKS;
 | |
| 	if (RAW != '>') {
 | |
| 	    xmlFatalErrMsgStr(ctxt, XML_ERR_ENTITY_NOT_FINISHED,
 | |
| 	            "xmlParseEntityDecl: entity %s not terminated\n", name);
 | |
| 	    xmlHaltParser(ctxt);
 | |
| 	} else {
 | |
| 	    if (inputid != ctxt->input->id) {
 | |
| 		xmlFatalErrMsg(ctxt, XML_ERR_ENTITY_BOUNDARY,
 | |
| 	                       "Entity declaration doesn't start and stop in"
 | |
|                                " the same entity\n");
 | |
| 	    }
 | |
| 	    NEXT;
 | |
| 	}
 | |
| 	if (orig != NULL) {
 | |
| 	    /*
 | |
| 	     * Ugly mechanism to save the raw entity value.
 | |
| 	     */
 | |
| 	    xmlEntityPtr cur = NULL;
 | |
| 
 | |
| 	    if (isParameter) {
 | |
| 	        if ((ctxt->sax != NULL) &&
 | |
| 		    (ctxt->sax->getParameterEntity != NULL))
 | |
| 		    cur = ctxt->sax->getParameterEntity(ctxt->userData, name);
 | |
| 	    } else {
 | |
| 	        if ((ctxt->sax != NULL) &&
 | |
| 		    (ctxt->sax->getEntity != NULL))
 | |
| 		    cur = ctxt->sax->getEntity(ctxt->userData, name);
 | |
| 		if ((cur == NULL) && (ctxt->userData==ctxt)) {
 | |
| 		    cur = xmlSAX2GetEntity(ctxt, name);
 | |
| 		}
 | |
| 	    }
 | |
|             if ((cur != NULL) && (cur->orig == NULL)) {
 | |
| 		cur->orig = orig;
 | |
|                 orig = NULL;
 | |
| 	    }
 | |
| 	}
 | |
| 
 | |
| done:
 | |
| 	if (value != NULL) xmlFree(value);
 | |
| 	if (URI != NULL) xmlFree(URI);
 | |
| 	if (literal != NULL) xmlFree(literal);
 | |
|         if (orig != NULL) xmlFree(orig);
 | |
|     }
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseDefaultDecl:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @value:  Receive a possible fixed default value for the attribute
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * Parse an attribute default declaration
 | |
|  *
 | |
|  * [60] DefaultDecl ::= '#REQUIRED' | '#IMPLIED' | (('#FIXED' S)? AttValue)
 | |
|  *
 | |
|  * [ VC: Required Attribute ]
 | |
|  * if the default declaration is the keyword #REQUIRED, then the
 | |
|  * attribute must be specified for all elements of the type in the
 | |
|  * attribute-list declaration.
 | |
|  *
 | |
|  * [ VC: Attribute Default Legal ]
 | |
|  * The declared default value must meet the lexical constraints of
 | |
|  * the declared attribute type c.f. xmlValidateAttributeDecl()
 | |
|  *
 | |
|  * [ VC: Fixed Attribute Default ]
 | |
|  * if an attribute has a default value declared with the #FIXED
 | |
|  * keyword, instances of that attribute must match the default value.
 | |
|  *
 | |
|  * [ WFC: No < in Attribute Values ]
 | |
|  * handled in xmlParseAttValue()
 | |
|  *
 | |
|  * returns: XML_ATTRIBUTE_NONE, XML_ATTRIBUTE_REQUIRED, XML_ATTRIBUTE_IMPLIED
 | |
|  *          or XML_ATTRIBUTE_FIXED.
 | |
|  */
 | |
| 
 | |
| int
 | |
| xmlParseDefaultDecl(xmlParserCtxtPtr ctxt, xmlChar **value) {
 | |
|     int val;
 | |
|     xmlChar *ret;
 | |
| 
 | |
|     *value = NULL;
 | |
|     if (CMP9(CUR_PTR, '#', 'R', 'E', 'Q', 'U', 'I', 'R', 'E', 'D')) {
 | |
| 	SKIP(9);
 | |
| 	return(XML_ATTRIBUTE_REQUIRED);
 | |
|     }
 | |
|     if (CMP8(CUR_PTR, '#', 'I', 'M', 'P', 'L', 'I', 'E', 'D')) {
 | |
| 	SKIP(8);
 | |
| 	return(XML_ATTRIBUTE_IMPLIED);
 | |
|     }
 | |
|     val = XML_ATTRIBUTE_NONE;
 | |
|     if (CMP6(CUR_PTR, '#', 'F', 'I', 'X', 'E', 'D')) {
 | |
| 	SKIP(6);
 | |
| 	val = XML_ATTRIBUTE_FIXED;
 | |
| 	if (SKIP_BLANKS == 0) {
 | |
| 	    xmlFatalErrMsg(ctxt, XML_ERR_SPACE_REQUIRED,
 | |
| 			   "Space required after '#FIXED'\n");
 | |
| 	}
 | |
|     }
 | |
|     ret = xmlParseAttValue(ctxt);
 | |
|     ctxt->instate = XML_PARSER_DTD;
 | |
|     if (ret == NULL) {
 | |
| 	xmlFatalErrMsg(ctxt, (xmlParserErrors)ctxt->errNo,
 | |
| 		       "Attribute default value declaration error\n");
 | |
|     } else
 | |
|         *value = ret;
 | |
|     return(val);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseNotationType:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * parse an Notation attribute type.
 | |
|  *
 | |
|  * Note: the leading 'NOTATION' S part has already being parsed...
 | |
|  *
 | |
|  * [58] NotationType ::= 'NOTATION' S '(' S? Name (S? '|' S? Name)* S? ')'
 | |
|  *
 | |
|  * [ VC: Notation Attributes ]
 | |
|  * Values of this type must match one of the notation names included
 | |
|  * in the declaration; all notation names in the declaration must be declared.
 | |
|  *
 | |
|  * Returns: the notation attribute tree built while parsing
 | |
|  */
 | |
| 
 | |
| xmlEnumerationPtr
 | |
| xmlParseNotationType(xmlParserCtxtPtr ctxt) {
 | |
|     const xmlChar *name;
 | |
|     xmlEnumerationPtr ret = NULL, last = NULL, cur, tmp;
 | |
| 
 | |
|     if (RAW != '(') {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_NOTATION_NOT_STARTED, NULL);
 | |
| 	return(NULL);
 | |
|     }
 | |
|     do {
 | |
|         NEXT;
 | |
| 	SKIP_BLANKS;
 | |
|         name = xmlParseName(ctxt);
 | |
| 	if (name == NULL) {
 | |
| 	    xmlFatalErrMsg(ctxt, XML_ERR_NAME_REQUIRED,
 | |
| 			   "Name expected in NOTATION declaration\n");
 | |
|             xmlFreeEnumeration(ret);
 | |
| 	    return(NULL);
 | |
| 	}
 | |
| 	tmp = ret;
 | |
| 	while (tmp != NULL) {
 | |
| 	    if (xmlStrEqual(name, tmp->name)) {
 | |
| 		xmlValidityError(ctxt, XML_DTD_DUP_TOKEN,
 | |
| 	  "standalone: attribute notation value token %s duplicated\n",
 | |
| 				 name, NULL);
 | |
| 		if (!xmlDictOwns(ctxt->dict, name))
 | |
| 		    xmlFree((xmlChar *) name);
 | |
| 		break;
 | |
| 	    }
 | |
| 	    tmp = tmp->next;
 | |
| 	}
 | |
| 	if (tmp == NULL) {
 | |
| 	    cur = xmlCreateEnumeration(name);
 | |
| 	    if (cur == NULL) {
 | |
|                 xmlFreeEnumeration(ret);
 | |
|                 return(NULL);
 | |
|             }
 | |
| 	    if (last == NULL) ret = last = cur;
 | |
| 	    else {
 | |
| 		last->next = cur;
 | |
| 		last = cur;
 | |
| 	    }
 | |
| 	}
 | |
| 	SKIP_BLANKS;
 | |
|     } while (RAW == '|');
 | |
|     if (RAW != ')') {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_NOTATION_NOT_FINISHED, NULL);
 | |
|         xmlFreeEnumeration(ret);
 | |
| 	return(NULL);
 | |
|     }
 | |
|     NEXT;
 | |
|     return(ret);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseEnumerationType:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * parse an Enumeration attribute type.
 | |
|  *
 | |
|  * [59] Enumeration ::= '(' S? Nmtoken (S? '|' S? Nmtoken)* S? ')'
 | |
|  *
 | |
|  * [ VC: Enumeration ]
 | |
|  * Values of this type must match one of the Nmtoken tokens in
 | |
|  * the declaration
 | |
|  *
 | |
|  * Returns: the enumeration attribute tree built while parsing
 | |
|  */
 | |
| 
 | |
| xmlEnumerationPtr
 | |
| xmlParseEnumerationType(xmlParserCtxtPtr ctxt) {
 | |
|     xmlChar *name;
 | |
|     xmlEnumerationPtr ret = NULL, last = NULL, cur, tmp;
 | |
| 
 | |
|     if (RAW != '(') {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_ATTLIST_NOT_STARTED, NULL);
 | |
| 	return(NULL);
 | |
|     }
 | |
|     do {
 | |
|         NEXT;
 | |
| 	SKIP_BLANKS;
 | |
|         name = xmlParseNmtoken(ctxt);
 | |
| 	if (name == NULL) {
 | |
| 	    xmlFatalErr(ctxt, XML_ERR_NMTOKEN_REQUIRED, NULL);
 | |
| 	    return(ret);
 | |
| 	}
 | |
| 	tmp = ret;
 | |
| 	while (tmp != NULL) {
 | |
| 	    if (xmlStrEqual(name, tmp->name)) {
 | |
| 		xmlValidityError(ctxt, XML_DTD_DUP_TOKEN,
 | |
| 	  "standalone: attribute enumeration value token %s duplicated\n",
 | |
| 				 name, NULL);
 | |
| 		if (!xmlDictOwns(ctxt->dict, name))
 | |
| 		    xmlFree(name);
 | |
| 		break;
 | |
| 	    }
 | |
| 	    tmp = tmp->next;
 | |
| 	}
 | |
| 	if (tmp == NULL) {
 | |
| 	    cur = xmlCreateEnumeration(name);
 | |
| 	    if (!xmlDictOwns(ctxt->dict, name))
 | |
| 		xmlFree(name);
 | |
| 	    if (cur == NULL) {
 | |
|                 xmlFreeEnumeration(ret);
 | |
|                 return(NULL);
 | |
|             }
 | |
| 	    if (last == NULL) ret = last = cur;
 | |
| 	    else {
 | |
| 		last->next = cur;
 | |
| 		last = cur;
 | |
| 	    }
 | |
| 	}
 | |
| 	SKIP_BLANKS;
 | |
|     } while (RAW == '|');
 | |
|     if (RAW != ')') {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_ATTLIST_NOT_FINISHED, NULL);
 | |
| 	return(ret);
 | |
|     }
 | |
|     NEXT;
 | |
|     return(ret);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseEnumeratedType:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @tree:  the enumeration tree built while parsing
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * parse an Enumerated attribute type.
 | |
|  *
 | |
|  * [57] EnumeratedType ::= NotationType | Enumeration
 | |
|  *
 | |
|  * [58] NotationType ::= 'NOTATION' S '(' S? Name (S? '|' S? Name)* S? ')'
 | |
|  *
 | |
|  *
 | |
|  * Returns: XML_ATTRIBUTE_ENUMERATION or XML_ATTRIBUTE_NOTATION
 | |
|  */
 | |
| 
 | |
| int
 | |
| xmlParseEnumeratedType(xmlParserCtxtPtr ctxt, xmlEnumerationPtr *tree) {
 | |
|     if (CMP8(CUR_PTR, 'N', 'O', 'T', 'A', 'T', 'I', 'O', 'N')) {
 | |
| 	SKIP(8);
 | |
| 	if (SKIP_BLANKS == 0) {
 | |
| 	    xmlFatalErrMsg(ctxt, XML_ERR_SPACE_REQUIRED,
 | |
| 			   "Space required after 'NOTATION'\n");
 | |
| 	    return(0);
 | |
| 	}
 | |
| 	*tree = xmlParseNotationType(ctxt);
 | |
| 	if (*tree == NULL) return(0);
 | |
| 	return(XML_ATTRIBUTE_NOTATION);
 | |
|     }
 | |
|     *tree = xmlParseEnumerationType(ctxt);
 | |
|     if (*tree == NULL) return(0);
 | |
|     return(XML_ATTRIBUTE_ENUMERATION);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseAttributeType:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @tree:  the enumeration tree built while parsing
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * parse the Attribute list def for an element
 | |
|  *
 | |
|  * [54] AttType ::= StringType | TokenizedType | EnumeratedType
 | |
|  *
 | |
|  * [55] StringType ::= 'CDATA'
 | |
|  *
 | |
|  * [56] TokenizedType ::= 'ID' | 'IDREF' | 'IDREFS' | 'ENTITY' |
 | |
|  *                        'ENTITIES' | 'NMTOKEN' | 'NMTOKENS'
 | |
|  *
 | |
|  * Validity constraints for attribute values syntax are checked in
 | |
|  * xmlValidateAttributeValue()
 | |
|  *
 | |
|  * [ VC: ID ]
 | |
|  * Values of type ID must match the Name production. A name must not
 | |
|  * appear more than once in an XML document as a value of this type;
 | |
|  * i.e., ID values must uniquely identify the elements which bear them.
 | |
|  *
 | |
|  * [ VC: One ID per Element Type ]
 | |
|  * No element type may have more than one ID attribute specified.
 | |
|  *
 | |
|  * [ VC: ID Attribute Default ]
 | |
|  * An ID attribute must have a declared default of #IMPLIED or #REQUIRED.
 | |
|  *
 | |
|  * [ VC: IDREF ]
 | |
|  * Values of type IDREF must match the Name production, and values
 | |
|  * of type IDREFS must match Names; each IDREF Name must match the value
 | |
|  * of an ID attribute on some element in the XML document; i.e. IDREF
 | |
|  * values must match the value of some ID attribute.
 | |
|  *
 | |
|  * [ VC: Entity Name ]
 | |
|  * Values of type ENTITY must match the Name production, values
 | |
|  * of type ENTITIES must match Names; each Entity Name must match the
 | |
|  * name of an unparsed entity declared in the DTD.
 | |
|  *
 | |
|  * [ VC: Name Token ]
 | |
|  * Values of type NMTOKEN must match the Nmtoken production; values
 | |
|  * of type NMTOKENS must match Nmtokens.
 | |
|  *
 | |
|  * Returns the attribute type
 | |
|  */
 | |
| int
 | |
| xmlParseAttributeType(xmlParserCtxtPtr ctxt, xmlEnumerationPtr *tree) {
 | |
|     if (CMP5(CUR_PTR, 'C', 'D', 'A', 'T', 'A')) {
 | |
| 	SKIP(5);
 | |
| 	return(XML_ATTRIBUTE_CDATA);
 | |
|      } else if (CMP6(CUR_PTR, 'I', 'D', 'R', 'E', 'F', 'S')) {
 | |
| 	SKIP(6);
 | |
| 	return(XML_ATTRIBUTE_IDREFS);
 | |
|      } else if (CMP5(CUR_PTR, 'I', 'D', 'R', 'E', 'F')) {
 | |
| 	SKIP(5);
 | |
| 	return(XML_ATTRIBUTE_IDREF);
 | |
|      } else if ((RAW == 'I') && (NXT(1) == 'D')) {
 | |
|         SKIP(2);
 | |
| 	return(XML_ATTRIBUTE_ID);
 | |
|      } else if (CMP6(CUR_PTR, 'E', 'N', 'T', 'I', 'T', 'Y')) {
 | |
| 	SKIP(6);
 | |
| 	return(XML_ATTRIBUTE_ENTITY);
 | |
|      } else if (CMP8(CUR_PTR, 'E', 'N', 'T', 'I', 'T', 'I', 'E', 'S')) {
 | |
| 	SKIP(8);
 | |
| 	return(XML_ATTRIBUTE_ENTITIES);
 | |
|      } else if (CMP8(CUR_PTR, 'N', 'M', 'T', 'O', 'K', 'E', 'N', 'S')) {
 | |
| 	SKIP(8);
 | |
| 	return(XML_ATTRIBUTE_NMTOKENS);
 | |
|      } else if (CMP7(CUR_PTR, 'N', 'M', 'T', 'O', 'K', 'E', 'N')) {
 | |
| 	SKIP(7);
 | |
| 	return(XML_ATTRIBUTE_NMTOKEN);
 | |
|      }
 | |
|      return(xmlParseEnumeratedType(ctxt, tree));
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseAttributeListDecl:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * Parse an attribute list declaration for an element. Always consumes '<!'.
 | |
|  *
 | |
|  * [52] AttlistDecl ::= '<!ATTLIST' S Name AttDef* S? '>'
 | |
|  *
 | |
|  * [53] AttDef ::= S Name S AttType S DefaultDecl
 | |
|  *
 | |
|  */
 | |
| void
 | |
| xmlParseAttributeListDecl(xmlParserCtxtPtr ctxt) {
 | |
|     const xmlChar *elemName;
 | |
|     const xmlChar *attrName;
 | |
|     xmlEnumerationPtr tree;
 | |
| 
 | |
|     if ((CUR != '<') || (NXT(1) != '!'))
 | |
|         return;
 | |
|     SKIP(2);
 | |
| 
 | |
|     if (CMP7(CUR_PTR, 'A', 'T', 'T', 'L', 'I', 'S', 'T')) {
 | |
| 	int inputid = ctxt->input->id;
 | |
| 
 | |
| 	SKIP(7);
 | |
| 	if (SKIP_BLANKS == 0) {
 | |
| 	    xmlFatalErrMsg(ctxt, XML_ERR_SPACE_REQUIRED,
 | |
| 		                 "Space required after '<!ATTLIST'\n");
 | |
| 	}
 | |
|         elemName = xmlParseName(ctxt);
 | |
| 	if (elemName == NULL) {
 | |
| 	    xmlFatalErrMsg(ctxt, XML_ERR_NAME_REQUIRED,
 | |
| 			   "ATTLIST: no name for Element\n");
 | |
| 	    return;
 | |
| 	}
 | |
| 	SKIP_BLANKS;
 | |
| 	GROW;
 | |
| 	while ((RAW != '>') && (ctxt->instate != XML_PARSER_EOF)) {
 | |
| 	    int type;
 | |
| 	    int def;
 | |
| 	    xmlChar *defaultValue = NULL;
 | |
| 
 | |
| 	    GROW;
 | |
|             tree = NULL;
 | |
| 	    attrName = xmlParseName(ctxt);
 | |
| 	    if (attrName == NULL) {
 | |
| 		xmlFatalErrMsg(ctxt, XML_ERR_NAME_REQUIRED,
 | |
| 			       "ATTLIST: no name for Attribute\n");
 | |
| 		break;
 | |
| 	    }
 | |
| 	    GROW;
 | |
| 	    if (SKIP_BLANKS == 0) {
 | |
| 		xmlFatalErrMsg(ctxt, XML_ERR_SPACE_REQUIRED,
 | |
| 		        "Space required after the attribute name\n");
 | |
| 		break;
 | |
| 	    }
 | |
| 
 | |
| 	    type = xmlParseAttributeType(ctxt, &tree);
 | |
| 	    if (type <= 0) {
 | |
| 	        break;
 | |
| 	    }
 | |
| 
 | |
| 	    GROW;
 | |
| 	    if (SKIP_BLANKS == 0) {
 | |
| 		xmlFatalErrMsg(ctxt, XML_ERR_SPACE_REQUIRED,
 | |
| 			       "Space required after the attribute type\n");
 | |
| 	        if (tree != NULL)
 | |
| 		    xmlFreeEnumeration(tree);
 | |
| 		break;
 | |
| 	    }
 | |
| 
 | |
| 	    def = xmlParseDefaultDecl(ctxt, &defaultValue);
 | |
| 	    if (def <= 0) {
 | |
|                 if (defaultValue != NULL)
 | |
| 		    xmlFree(defaultValue);
 | |
| 	        if (tree != NULL)
 | |
| 		    xmlFreeEnumeration(tree);
 | |
| 	        break;
 | |
| 	    }
 | |
| 	    if ((type != XML_ATTRIBUTE_CDATA) && (defaultValue != NULL))
 | |
| 	        xmlAttrNormalizeSpace(defaultValue, defaultValue);
 | |
| 
 | |
| 	    GROW;
 | |
|             if (RAW != '>') {
 | |
| 		if (SKIP_BLANKS == 0) {
 | |
| 		    xmlFatalErrMsg(ctxt, XML_ERR_SPACE_REQUIRED,
 | |
| 			"Space required after the attribute default value\n");
 | |
| 		    if (defaultValue != NULL)
 | |
| 			xmlFree(defaultValue);
 | |
| 		    if (tree != NULL)
 | |
| 			xmlFreeEnumeration(tree);
 | |
| 		    break;
 | |
| 		}
 | |
| 	    }
 | |
| 	    if ((ctxt->sax != NULL) && (!ctxt->disableSAX) &&
 | |
| 		(ctxt->sax->attributeDecl != NULL))
 | |
| 		ctxt->sax->attributeDecl(ctxt->userData, elemName, attrName,
 | |
| 	                        type, def, defaultValue, tree);
 | |
| 	    else if (tree != NULL)
 | |
| 		xmlFreeEnumeration(tree);
 | |
| 
 | |
| 	    if ((ctxt->sax2) && (defaultValue != NULL) &&
 | |
| 	        (def != XML_ATTRIBUTE_IMPLIED) &&
 | |
| 		(def != XML_ATTRIBUTE_REQUIRED)) {
 | |
| 		xmlAddDefAttrs(ctxt, elemName, attrName, defaultValue);
 | |
| 	    }
 | |
| 	    if (ctxt->sax2) {
 | |
| 		xmlAddSpecialAttr(ctxt, elemName, attrName, type);
 | |
| 	    }
 | |
| 	    if (defaultValue != NULL)
 | |
| 	        xmlFree(defaultValue);
 | |
| 	    GROW;
 | |
| 	}
 | |
| 	if (RAW == '>') {
 | |
| 	    if (inputid != ctxt->input->id) {
 | |
| 		xmlFatalErrMsg(ctxt, XML_ERR_ENTITY_BOUNDARY,
 | |
|                                "Attribute list declaration doesn't start and"
 | |
|                                " stop in the same entity\n");
 | |
| 	    }
 | |
| 	    NEXT;
 | |
| 	}
 | |
|     }
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseElementMixedContentDecl:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @inputchk:  the input used for the current entity, needed for boundary checks
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * parse the declaration for a Mixed Element content
 | |
|  * The leading '(' and spaces have been skipped in xmlParseElementContentDecl
 | |
|  *
 | |
|  * [51] Mixed ::= '(' S? '#PCDATA' (S? '|' S? Name)* S? ')*' |
 | |
|  *                '(' S? '#PCDATA' S? ')'
 | |
|  *
 | |
|  * [ VC: Proper Group/PE Nesting ] applies to [51] too (see [49])
 | |
|  *
 | |
|  * [ VC: No Duplicate Types ]
 | |
|  * The same name must not appear more than once in a single
 | |
|  * mixed-content declaration.
 | |
|  *
 | |
|  * returns: the list of the xmlElementContentPtr describing the element choices
 | |
|  */
 | |
| xmlElementContentPtr
 | |
| xmlParseElementMixedContentDecl(xmlParserCtxtPtr ctxt, int inputchk) {
 | |
|     xmlElementContentPtr ret = NULL, cur = NULL, n;
 | |
|     const xmlChar *elem = NULL;
 | |
| 
 | |
|     GROW;
 | |
|     if (CMP7(CUR_PTR, '#', 'P', 'C', 'D', 'A', 'T', 'A')) {
 | |
| 	SKIP(7);
 | |
| 	SKIP_BLANKS;
 | |
| 	if (RAW == ')') {
 | |
| 	    if (ctxt->input->id != inputchk) {
 | |
| 		xmlFatalErrMsg(ctxt, XML_ERR_ENTITY_BOUNDARY,
 | |
|                                "Element content declaration doesn't start and"
 | |
|                                " stop in the same entity\n");
 | |
| 	    }
 | |
| 	    NEXT;
 | |
| 	    ret = xmlNewDocElementContent(ctxt->myDoc, NULL, XML_ELEMENT_CONTENT_PCDATA);
 | |
| 	    if (ret == NULL)
 | |
| 	        return(NULL);
 | |
| 	    if (RAW == '*') {
 | |
| 		ret->ocur = XML_ELEMENT_CONTENT_MULT;
 | |
| 		NEXT;
 | |
| 	    }
 | |
| 	    return(ret);
 | |
| 	}
 | |
| 	if ((RAW == '(') || (RAW == '|')) {
 | |
| 	    ret = cur = xmlNewDocElementContent(ctxt->myDoc, NULL, XML_ELEMENT_CONTENT_PCDATA);
 | |
| 	    if (ret == NULL) return(NULL);
 | |
| 	}
 | |
| 	while ((RAW == '|') && (ctxt->instate != XML_PARSER_EOF)) {
 | |
| 	    NEXT;
 | |
| 	    if (elem == NULL) {
 | |
| 	        ret = xmlNewDocElementContent(ctxt->myDoc, NULL, XML_ELEMENT_CONTENT_OR);
 | |
| 		if (ret == NULL) {
 | |
| 		    xmlFreeDocElementContent(ctxt->myDoc, cur);
 | |
|                     return(NULL);
 | |
|                 }
 | |
| 		ret->c1 = cur;
 | |
| 		if (cur != NULL)
 | |
| 		    cur->parent = ret;
 | |
| 		cur = ret;
 | |
| 	    } else {
 | |
| 	        n = xmlNewDocElementContent(ctxt->myDoc, NULL, XML_ELEMENT_CONTENT_OR);
 | |
| 		if (n == NULL) {
 | |
| 		    xmlFreeDocElementContent(ctxt->myDoc, ret);
 | |
|                     return(NULL);
 | |
|                 }
 | |
| 		n->c1 = xmlNewDocElementContent(ctxt->myDoc, elem, XML_ELEMENT_CONTENT_ELEMENT);
 | |
| 		if (n->c1 != NULL)
 | |
| 		    n->c1->parent = n;
 | |
| 	        cur->c2 = n;
 | |
| 		if (n != NULL)
 | |
| 		    n->parent = cur;
 | |
| 		cur = n;
 | |
| 	    }
 | |
| 	    SKIP_BLANKS;
 | |
| 	    elem = xmlParseName(ctxt);
 | |
| 	    if (elem == NULL) {
 | |
| 		xmlFatalErrMsg(ctxt, XML_ERR_NAME_REQUIRED,
 | |
| 			"xmlParseElementMixedContentDecl : Name expected\n");
 | |
| 		xmlFreeDocElementContent(ctxt->myDoc, ret);
 | |
| 		return(NULL);
 | |
| 	    }
 | |
| 	    SKIP_BLANKS;
 | |
| 	    GROW;
 | |
| 	}
 | |
| 	if ((RAW == ')') && (NXT(1) == '*')) {
 | |
| 	    if (elem != NULL) {
 | |
| 		cur->c2 = xmlNewDocElementContent(ctxt->myDoc, elem,
 | |
| 		                               XML_ELEMENT_CONTENT_ELEMENT);
 | |
| 		if (cur->c2 != NULL)
 | |
| 		    cur->c2->parent = cur;
 | |
|             }
 | |
|             if (ret != NULL)
 | |
|                 ret->ocur = XML_ELEMENT_CONTENT_MULT;
 | |
| 	    if (ctxt->input->id != inputchk) {
 | |
| 		xmlFatalErrMsg(ctxt, XML_ERR_ENTITY_BOUNDARY,
 | |
|                                "Element content declaration doesn't start and"
 | |
|                                " stop in the same entity\n");
 | |
| 	    }
 | |
| 	    SKIP(2);
 | |
| 	} else {
 | |
| 	    xmlFreeDocElementContent(ctxt->myDoc, ret);
 | |
| 	    xmlFatalErr(ctxt, XML_ERR_MIXED_NOT_STARTED, NULL);
 | |
| 	    return(NULL);
 | |
| 	}
 | |
| 
 | |
|     } else {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_PCDATA_REQUIRED, NULL);
 | |
|     }
 | |
|     return(ret);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseElementChildrenContentDeclPriv:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @inputchk:  the input used for the current entity, needed for boundary checks
 | |
|  * @depth: the level of recursion
 | |
|  *
 | |
|  * parse the declaration for a Mixed Element content
 | |
|  * The leading '(' and spaces have been skipped in xmlParseElementContentDecl
 | |
|  *
 | |
|  *
 | |
|  * [47] children ::= (choice | seq) ('?' | '*' | '+')?
 | |
|  *
 | |
|  * [48] cp ::= (Name | choice | seq) ('?' | '*' | '+')?
 | |
|  *
 | |
|  * [49] choice ::= '(' S? cp ( S? '|' S? cp )* S? ')'
 | |
|  *
 | |
|  * [50] seq ::= '(' S? cp ( S? ',' S? cp )* S? ')'
 | |
|  *
 | |
|  * [ VC: Proper Group/PE Nesting ] applies to [49] and [50]
 | |
|  * TODO Parameter-entity replacement text must be properly nested
 | |
|  *	with parenthesized groups. That is to say, if either of the
 | |
|  *	opening or closing parentheses in a choice, seq, or Mixed
 | |
|  *	construct is contained in the replacement text for a parameter
 | |
|  *	entity, both must be contained in the same replacement text. For
 | |
|  *	interoperability, if a parameter-entity reference appears in a
 | |
|  *	choice, seq, or Mixed construct, its replacement text should not
 | |
|  *	be empty, and neither the first nor last non-blank character of
 | |
|  *	the replacement text should be a connector (| or ,).
 | |
|  *
 | |
|  * Returns the tree of xmlElementContentPtr describing the element
 | |
|  *          hierarchy.
 | |
|  */
 | |
| static xmlElementContentPtr
 | |
| xmlParseElementChildrenContentDeclPriv(xmlParserCtxtPtr ctxt, int inputchk,
 | |
|                                        int depth) {
 | |
|     xmlElementContentPtr ret = NULL, cur = NULL, last = NULL, op = NULL;
 | |
|     const xmlChar *elem;
 | |
|     xmlChar type = 0;
 | |
| 
 | |
|     if (((depth > 128) && ((ctxt->options & XML_PARSE_HUGE) == 0)) ||
 | |
|         (depth >  2048)) {
 | |
|         xmlFatalErrMsgInt(ctxt, XML_ERR_ELEMCONTENT_NOT_FINISHED,
 | |
| "xmlParseElementChildrenContentDecl : depth %d too deep, use XML_PARSE_HUGE\n",
 | |
|                           depth);
 | |
| 	return(NULL);
 | |
|     }
 | |
|     SKIP_BLANKS;
 | |
|     GROW;
 | |
|     if (RAW == '(') {
 | |
| 	int inputid = ctxt->input->id;
 | |
| 
 | |
|         /* Recurse on first child */
 | |
| 	NEXT;
 | |
| 	SKIP_BLANKS;
 | |
|         cur = ret = xmlParseElementChildrenContentDeclPriv(ctxt, inputid,
 | |
|                                                            depth + 1);
 | |
|         if (cur == NULL)
 | |
|             return(NULL);
 | |
| 	SKIP_BLANKS;
 | |
| 	GROW;
 | |
|     } else {
 | |
| 	elem = xmlParseName(ctxt);
 | |
| 	if (elem == NULL) {
 | |
| 	    xmlFatalErr(ctxt, XML_ERR_ELEMCONTENT_NOT_STARTED, NULL);
 | |
| 	    return(NULL);
 | |
| 	}
 | |
|         cur = ret = xmlNewDocElementContent(ctxt->myDoc, elem, XML_ELEMENT_CONTENT_ELEMENT);
 | |
| 	if (cur == NULL) {
 | |
| 	    xmlErrMemory(ctxt, NULL);
 | |
| 	    return(NULL);
 | |
| 	}
 | |
| 	GROW;
 | |
| 	if (RAW == '?') {
 | |
| 	    cur->ocur = XML_ELEMENT_CONTENT_OPT;
 | |
| 	    NEXT;
 | |
| 	} else if (RAW == '*') {
 | |
| 	    cur->ocur = XML_ELEMENT_CONTENT_MULT;
 | |
| 	    NEXT;
 | |
| 	} else if (RAW == '+') {
 | |
| 	    cur->ocur = XML_ELEMENT_CONTENT_PLUS;
 | |
| 	    NEXT;
 | |
| 	} else {
 | |
| 	    cur->ocur = XML_ELEMENT_CONTENT_ONCE;
 | |
| 	}
 | |
| 	GROW;
 | |
|     }
 | |
|     SKIP_BLANKS;
 | |
|     while ((RAW != ')') && (ctxt->instate != XML_PARSER_EOF)) {
 | |
|         /*
 | |
| 	 * Each loop we parse one separator and one element.
 | |
| 	 */
 | |
|         if (RAW == ',') {
 | |
| 	    if (type == 0) type = CUR;
 | |
| 
 | |
| 	    /*
 | |
| 	     * Detect "Name | Name , Name" error
 | |
| 	     */
 | |
| 	    else if (type != CUR) {
 | |
| 		xmlFatalErrMsgInt(ctxt, XML_ERR_SEPARATOR_REQUIRED,
 | |
| 		    "xmlParseElementChildrenContentDecl : '%c' expected\n",
 | |
| 		                  type);
 | |
| 		if ((last != NULL) && (last != ret))
 | |
| 		    xmlFreeDocElementContent(ctxt->myDoc, last);
 | |
| 		if (ret != NULL)
 | |
| 		    xmlFreeDocElementContent(ctxt->myDoc, ret);
 | |
| 		return(NULL);
 | |
| 	    }
 | |
| 	    NEXT;
 | |
| 
 | |
| 	    op = xmlNewDocElementContent(ctxt->myDoc, NULL, XML_ELEMENT_CONTENT_SEQ);
 | |
| 	    if (op == NULL) {
 | |
| 		if ((last != NULL) && (last != ret))
 | |
| 		    xmlFreeDocElementContent(ctxt->myDoc, last);
 | |
| 	        xmlFreeDocElementContent(ctxt->myDoc, ret);
 | |
| 		return(NULL);
 | |
| 	    }
 | |
| 	    if (last == NULL) {
 | |
| 		op->c1 = ret;
 | |
| 		if (ret != NULL)
 | |
| 		    ret->parent = op;
 | |
| 		ret = cur = op;
 | |
| 	    } else {
 | |
| 	        cur->c2 = op;
 | |
| 		if (op != NULL)
 | |
| 		    op->parent = cur;
 | |
| 		op->c1 = last;
 | |
| 		if (last != NULL)
 | |
| 		    last->parent = op;
 | |
| 		cur =op;
 | |
| 		last = NULL;
 | |
| 	    }
 | |
| 	} else if (RAW == '|') {
 | |
| 	    if (type == 0) type = CUR;
 | |
| 
 | |
| 	    /*
 | |
| 	     * Detect "Name , Name | Name" error
 | |
| 	     */
 | |
| 	    else if (type != CUR) {
 | |
| 		xmlFatalErrMsgInt(ctxt, XML_ERR_SEPARATOR_REQUIRED,
 | |
| 		    "xmlParseElementChildrenContentDecl : '%c' expected\n",
 | |
| 				  type);
 | |
| 		if ((last != NULL) && (last != ret))
 | |
| 		    xmlFreeDocElementContent(ctxt->myDoc, last);
 | |
| 		if (ret != NULL)
 | |
| 		    xmlFreeDocElementContent(ctxt->myDoc, ret);
 | |
| 		return(NULL);
 | |
| 	    }
 | |
| 	    NEXT;
 | |
| 
 | |
| 	    op = xmlNewDocElementContent(ctxt->myDoc, NULL, XML_ELEMENT_CONTENT_OR);
 | |
| 	    if (op == NULL) {
 | |
| 		if ((last != NULL) && (last != ret))
 | |
| 		    xmlFreeDocElementContent(ctxt->myDoc, last);
 | |
| 		if (ret != NULL)
 | |
| 		    xmlFreeDocElementContent(ctxt->myDoc, ret);
 | |
| 		return(NULL);
 | |
| 	    }
 | |
| 	    if (last == NULL) {
 | |
| 		op->c1 = ret;
 | |
| 		if (ret != NULL)
 | |
| 		    ret->parent = op;
 | |
| 		ret = cur = op;
 | |
| 	    } else {
 | |
| 	        cur->c2 = op;
 | |
| 		if (op != NULL)
 | |
| 		    op->parent = cur;
 | |
| 		op->c1 = last;
 | |
| 		if (last != NULL)
 | |
| 		    last->parent = op;
 | |
| 		cur =op;
 | |
| 		last = NULL;
 | |
| 	    }
 | |
| 	} else {
 | |
| 	    xmlFatalErr(ctxt, XML_ERR_ELEMCONTENT_NOT_FINISHED, NULL);
 | |
| 	    if ((last != NULL) && (last != ret))
 | |
| 	        xmlFreeDocElementContent(ctxt->myDoc, last);
 | |
| 	    if (ret != NULL)
 | |
| 		xmlFreeDocElementContent(ctxt->myDoc, ret);
 | |
| 	    return(NULL);
 | |
| 	}
 | |
| 	GROW;
 | |
| 	SKIP_BLANKS;
 | |
| 	GROW;
 | |
| 	if (RAW == '(') {
 | |
| 	    int inputid = ctxt->input->id;
 | |
| 	    /* Recurse on second child */
 | |
| 	    NEXT;
 | |
| 	    SKIP_BLANKS;
 | |
| 	    last = xmlParseElementChildrenContentDeclPriv(ctxt, inputid,
 | |
|                                                           depth + 1);
 | |
|             if (last == NULL) {
 | |
| 		if (ret != NULL)
 | |
| 		    xmlFreeDocElementContent(ctxt->myDoc, ret);
 | |
| 		return(NULL);
 | |
|             }
 | |
| 	    SKIP_BLANKS;
 | |
| 	} else {
 | |
| 	    elem = xmlParseName(ctxt);
 | |
| 	    if (elem == NULL) {
 | |
| 		xmlFatalErr(ctxt, XML_ERR_ELEMCONTENT_NOT_STARTED, NULL);
 | |
| 		if (ret != NULL)
 | |
| 		    xmlFreeDocElementContent(ctxt->myDoc, ret);
 | |
| 		return(NULL);
 | |
| 	    }
 | |
| 	    last = xmlNewDocElementContent(ctxt->myDoc, elem, XML_ELEMENT_CONTENT_ELEMENT);
 | |
| 	    if (last == NULL) {
 | |
| 		if (ret != NULL)
 | |
| 		    xmlFreeDocElementContent(ctxt->myDoc, ret);
 | |
| 		return(NULL);
 | |
| 	    }
 | |
| 	    if (RAW == '?') {
 | |
| 		last->ocur = XML_ELEMENT_CONTENT_OPT;
 | |
| 		NEXT;
 | |
| 	    } else if (RAW == '*') {
 | |
| 		last->ocur = XML_ELEMENT_CONTENT_MULT;
 | |
| 		NEXT;
 | |
| 	    } else if (RAW == '+') {
 | |
| 		last->ocur = XML_ELEMENT_CONTENT_PLUS;
 | |
| 		NEXT;
 | |
| 	    } else {
 | |
| 		last->ocur = XML_ELEMENT_CONTENT_ONCE;
 | |
| 	    }
 | |
| 	}
 | |
| 	SKIP_BLANKS;
 | |
| 	GROW;
 | |
|     }
 | |
|     if ((cur != NULL) && (last != NULL)) {
 | |
|         cur->c2 = last;
 | |
| 	if (last != NULL)
 | |
| 	    last->parent = cur;
 | |
|     }
 | |
|     if (ctxt->input->id != inputchk) {
 | |
| 	xmlFatalErrMsg(ctxt, XML_ERR_ENTITY_BOUNDARY,
 | |
|                        "Element content declaration doesn't start and stop in"
 | |
|                        " the same entity\n");
 | |
|     }
 | |
|     NEXT;
 | |
|     if (RAW == '?') {
 | |
| 	if (ret != NULL) {
 | |
| 	    if ((ret->ocur == XML_ELEMENT_CONTENT_PLUS) ||
 | |
| 	        (ret->ocur == XML_ELEMENT_CONTENT_MULT))
 | |
| 	        ret->ocur = XML_ELEMENT_CONTENT_MULT;
 | |
| 	    else
 | |
| 	        ret->ocur = XML_ELEMENT_CONTENT_OPT;
 | |
| 	}
 | |
| 	NEXT;
 | |
|     } else if (RAW == '*') {
 | |
| 	if (ret != NULL) {
 | |
| 	    ret->ocur = XML_ELEMENT_CONTENT_MULT;
 | |
| 	    cur = ret;
 | |
| 	    /*
 | |
| 	     * Some normalization:
 | |
| 	     * (a | b* | c?)* == (a | b | c)*
 | |
| 	     */
 | |
| 	    while ((cur != NULL) && (cur->type == XML_ELEMENT_CONTENT_OR)) {
 | |
| 		if ((cur->c1 != NULL) &&
 | |
| 	            ((cur->c1->ocur == XML_ELEMENT_CONTENT_OPT) ||
 | |
| 		     (cur->c1->ocur == XML_ELEMENT_CONTENT_MULT)))
 | |
| 		    cur->c1->ocur = XML_ELEMENT_CONTENT_ONCE;
 | |
| 		if ((cur->c2 != NULL) &&
 | |
| 	            ((cur->c2->ocur == XML_ELEMENT_CONTENT_OPT) ||
 | |
| 		     (cur->c2->ocur == XML_ELEMENT_CONTENT_MULT)))
 | |
| 		    cur->c2->ocur = XML_ELEMENT_CONTENT_ONCE;
 | |
| 		cur = cur->c2;
 | |
| 	    }
 | |
| 	}
 | |
| 	NEXT;
 | |
|     } else if (RAW == '+') {
 | |
| 	if (ret != NULL) {
 | |
| 	    int found = 0;
 | |
| 
 | |
| 	    if ((ret->ocur == XML_ELEMENT_CONTENT_OPT) ||
 | |
| 	        (ret->ocur == XML_ELEMENT_CONTENT_MULT))
 | |
| 	        ret->ocur = XML_ELEMENT_CONTENT_MULT;
 | |
| 	    else
 | |
| 	        ret->ocur = XML_ELEMENT_CONTENT_PLUS;
 | |
| 	    /*
 | |
| 	     * Some normalization:
 | |
| 	     * (a | b*)+ == (a | b)*
 | |
| 	     * (a | b?)+ == (a | b)*
 | |
| 	     */
 | |
| 	    while ((cur != NULL) && (cur->type == XML_ELEMENT_CONTENT_OR)) {
 | |
| 		if ((cur->c1 != NULL) &&
 | |
| 	            ((cur->c1->ocur == XML_ELEMENT_CONTENT_OPT) ||
 | |
| 		     (cur->c1->ocur == XML_ELEMENT_CONTENT_MULT))) {
 | |
| 		    cur->c1->ocur = XML_ELEMENT_CONTENT_ONCE;
 | |
| 		    found = 1;
 | |
| 		}
 | |
| 		if ((cur->c2 != NULL) &&
 | |
| 	            ((cur->c2->ocur == XML_ELEMENT_CONTENT_OPT) ||
 | |
| 		     (cur->c2->ocur == XML_ELEMENT_CONTENT_MULT))) {
 | |
| 		    cur->c2->ocur = XML_ELEMENT_CONTENT_ONCE;
 | |
| 		    found = 1;
 | |
| 		}
 | |
| 		cur = cur->c2;
 | |
| 	    }
 | |
| 	    if (found)
 | |
| 		ret->ocur = XML_ELEMENT_CONTENT_MULT;
 | |
| 	}
 | |
| 	NEXT;
 | |
|     }
 | |
|     return(ret);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseElementChildrenContentDecl:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @inputchk:  the input used for the current entity, needed for boundary checks
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * parse the declaration for a Mixed Element content
 | |
|  * The leading '(' and spaces have been skipped in xmlParseElementContentDecl
 | |
|  *
 | |
|  * [47] children ::= (choice | seq) ('?' | '*' | '+')?
 | |
|  *
 | |
|  * [48] cp ::= (Name | choice | seq) ('?' | '*' | '+')?
 | |
|  *
 | |
|  * [49] choice ::= '(' S? cp ( S? '|' S? cp )* S? ')'
 | |
|  *
 | |
|  * [50] seq ::= '(' S? cp ( S? ',' S? cp )* S? ')'
 | |
|  *
 | |
|  * [ VC: Proper Group/PE Nesting ] applies to [49] and [50]
 | |
|  * TODO Parameter-entity replacement text must be properly nested
 | |
|  *	with parenthesized groups. That is to say, if either of the
 | |
|  *	opening or closing parentheses in a choice, seq, or Mixed
 | |
|  *	construct is contained in the replacement text for a parameter
 | |
|  *	entity, both must be contained in the same replacement text. For
 | |
|  *	interoperability, if a parameter-entity reference appears in a
 | |
|  *	choice, seq, or Mixed construct, its replacement text should not
 | |
|  *	be empty, and neither the first nor last non-blank character of
 | |
|  *	the replacement text should be a connector (| or ,).
 | |
|  *
 | |
|  * Returns the tree of xmlElementContentPtr describing the element
 | |
|  *          hierarchy.
 | |
|  */
 | |
| xmlElementContentPtr
 | |
| xmlParseElementChildrenContentDecl(xmlParserCtxtPtr ctxt, int inputchk) {
 | |
|     /* stub left for API/ABI compat */
 | |
|     return(xmlParseElementChildrenContentDeclPriv(ctxt, inputchk, 1));
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseElementContentDecl:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @name:  the name of the element being defined.
 | |
|  * @result:  the Element Content pointer will be stored here if any
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * parse the declaration for an Element content either Mixed or Children,
 | |
|  * the cases EMPTY and ANY are handled directly in xmlParseElementDecl
 | |
|  *
 | |
|  * [46] contentspec ::= 'EMPTY' | 'ANY' | Mixed | children
 | |
|  *
 | |
|  * returns: the type of element content XML_ELEMENT_TYPE_xxx
 | |
|  */
 | |
| 
 | |
| int
 | |
| xmlParseElementContentDecl(xmlParserCtxtPtr ctxt, const xmlChar *name,
 | |
|                            xmlElementContentPtr *result) {
 | |
| 
 | |
|     xmlElementContentPtr tree = NULL;
 | |
|     int inputid = ctxt->input->id;
 | |
|     int res;
 | |
| 
 | |
|     *result = NULL;
 | |
| 
 | |
|     if (RAW != '(') {
 | |
| 	xmlFatalErrMsgStr(ctxt, XML_ERR_ELEMCONTENT_NOT_STARTED,
 | |
| 		"xmlParseElementContentDecl : %s '(' expected\n", name);
 | |
| 	return(-1);
 | |
|     }
 | |
|     NEXT;
 | |
|     GROW;
 | |
|     if (ctxt->instate == XML_PARSER_EOF)
 | |
|         return(-1);
 | |
|     SKIP_BLANKS;
 | |
|     if (CMP7(CUR_PTR, '#', 'P', 'C', 'D', 'A', 'T', 'A')) {
 | |
|         tree = xmlParseElementMixedContentDecl(ctxt, inputid);
 | |
| 	res = XML_ELEMENT_TYPE_MIXED;
 | |
|     } else {
 | |
|         tree = xmlParseElementChildrenContentDeclPriv(ctxt, inputid, 1);
 | |
| 	res = XML_ELEMENT_TYPE_ELEMENT;
 | |
|     }
 | |
|     SKIP_BLANKS;
 | |
|     *result = tree;
 | |
|     return(res);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseElementDecl:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * Parse an element declaration. Always consumes '<!'.
 | |
|  *
 | |
|  * [45] elementdecl ::= '<!ELEMENT' S Name S contentspec S? '>'
 | |
|  *
 | |
|  * [ VC: Unique Element Type Declaration ]
 | |
|  * No element type may be declared more than once
 | |
|  *
 | |
|  * Returns the type of the element, or -1 in case of error
 | |
|  */
 | |
| int
 | |
| xmlParseElementDecl(xmlParserCtxtPtr ctxt) {
 | |
|     const xmlChar *name;
 | |
|     int ret = -1;
 | |
|     xmlElementContentPtr content  = NULL;
 | |
| 
 | |
|     if ((CUR != '<') || (NXT(1) != '!'))
 | |
|         return(ret);
 | |
|     SKIP(2);
 | |
| 
 | |
|     /* GROW; done in the caller */
 | |
|     if (CMP7(CUR_PTR, 'E', 'L', 'E', 'M', 'E', 'N', 'T')) {
 | |
| 	int inputid = ctxt->input->id;
 | |
| 
 | |
| 	SKIP(7);
 | |
| 	if (SKIP_BLANKS == 0) {
 | |
| 	    xmlFatalErrMsg(ctxt, XML_ERR_SPACE_REQUIRED,
 | |
| 		           "Space required after 'ELEMENT'\n");
 | |
| 	    return(-1);
 | |
| 	}
 | |
|         name = xmlParseName(ctxt);
 | |
| 	if (name == NULL) {
 | |
| 	    xmlFatalErrMsg(ctxt, XML_ERR_NAME_REQUIRED,
 | |
| 			   "xmlParseElementDecl: no name for Element\n");
 | |
| 	    return(-1);
 | |
| 	}
 | |
| 	if (SKIP_BLANKS == 0) {
 | |
| 	    xmlFatalErrMsg(ctxt, XML_ERR_SPACE_REQUIRED,
 | |
| 			   "Space required after the element name\n");
 | |
| 	}
 | |
| 	if (CMP5(CUR_PTR, 'E', 'M', 'P', 'T', 'Y')) {
 | |
| 	    SKIP(5);
 | |
| 	    /*
 | |
| 	     * Element must always be empty.
 | |
| 	     */
 | |
| 	    ret = XML_ELEMENT_TYPE_EMPTY;
 | |
| 	} else if ((RAW == 'A') && (NXT(1) == 'N') &&
 | |
| 	           (NXT(2) == 'Y')) {
 | |
| 	    SKIP(3);
 | |
| 	    /*
 | |
| 	     * Element is a generic container.
 | |
| 	     */
 | |
| 	    ret = XML_ELEMENT_TYPE_ANY;
 | |
| 	} else if (RAW == '(') {
 | |
| 	    ret = xmlParseElementContentDecl(ctxt, name, &content);
 | |
| 	} else {
 | |
| 	    /*
 | |
| 	     * [ WFC: PEs in Internal Subset ] error handling.
 | |
| 	     */
 | |
| 	    if ((RAW == '%') && (ctxt->external == 0) &&
 | |
| 	        (ctxt->inputNr == 1)) {
 | |
| 		xmlFatalErrMsg(ctxt, XML_ERR_PEREF_IN_INT_SUBSET,
 | |
| 	  "PEReference: forbidden within markup decl in internal subset\n");
 | |
| 	    } else {
 | |
| 		xmlFatalErrMsg(ctxt, XML_ERR_ELEMCONTENT_NOT_STARTED,
 | |
| 		      "xmlParseElementDecl: 'EMPTY', 'ANY' or '(' expected\n");
 | |
|             }
 | |
| 	    return(-1);
 | |
| 	}
 | |
| 
 | |
| 	SKIP_BLANKS;
 | |
| 
 | |
| 	if (RAW != '>') {
 | |
| 	    xmlFatalErr(ctxt, XML_ERR_GT_REQUIRED, NULL);
 | |
| 	    if (content != NULL) {
 | |
| 		xmlFreeDocElementContent(ctxt->myDoc, content);
 | |
| 	    }
 | |
| 	} else {
 | |
| 	    if (inputid != ctxt->input->id) {
 | |
| 		xmlFatalErrMsg(ctxt, XML_ERR_ENTITY_BOUNDARY,
 | |
|                                "Element declaration doesn't start and stop in"
 | |
|                                " the same entity\n");
 | |
| 	    }
 | |
| 
 | |
| 	    NEXT;
 | |
| 	    if ((ctxt->sax != NULL) && (!ctxt->disableSAX) &&
 | |
| 		(ctxt->sax->elementDecl != NULL)) {
 | |
| 		if (content != NULL)
 | |
| 		    content->parent = NULL;
 | |
| 	        ctxt->sax->elementDecl(ctxt->userData, name, ret,
 | |
| 		                       content);
 | |
| 		if ((content != NULL) && (content->parent == NULL)) {
 | |
| 		    /*
 | |
| 		     * this is a trick: if xmlAddElementDecl is called,
 | |
| 		     * instead of copying the full tree it is plugged directly
 | |
| 		     * if called from the parser. Avoid duplicating the
 | |
| 		     * interfaces or change the API/ABI
 | |
| 		     */
 | |
| 		    xmlFreeDocElementContent(ctxt->myDoc, content);
 | |
| 		}
 | |
| 	    } else if (content != NULL) {
 | |
| 		xmlFreeDocElementContent(ctxt->myDoc, content);
 | |
| 	    }
 | |
| 	}
 | |
|     }
 | |
|     return(ret);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseConditionalSections
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * Parse a conditional section. Always consumes '<!['.
 | |
|  *
 | |
|  * [61] conditionalSect ::= includeSect | ignoreSect
 | |
|  * [62] includeSect ::= '<![' S? 'INCLUDE' S? '[' extSubsetDecl ']]>'
 | |
|  * [63] ignoreSect ::= '<![' S? 'IGNORE' S? '[' ignoreSectContents* ']]>'
 | |
|  * [64] ignoreSectContents ::= Ignore ('<![' ignoreSectContents ']]>' Ignore)*
 | |
|  * [65] Ignore ::= Char* - (Char* ('<![' | ']]>') Char*)
 | |
|  */
 | |
| 
 | |
| static void
 | |
| xmlParseConditionalSections(xmlParserCtxtPtr ctxt) {
 | |
|     int *inputIds = NULL;
 | |
|     size_t inputIdsSize = 0;
 | |
|     size_t depth = 0;
 | |
| 
 | |
|     while (ctxt->instate != XML_PARSER_EOF) {
 | |
|         if ((RAW == '<') && (NXT(1) == '!') && (NXT(2) == '[')) {
 | |
|             int id = ctxt->input->id;
 | |
| 
 | |
|             SKIP(3);
 | |
|             SKIP_BLANKS;
 | |
| 
 | |
|             if (CMP7(CUR_PTR, 'I', 'N', 'C', 'L', 'U', 'D', 'E')) {
 | |
|                 SKIP(7);
 | |
|                 SKIP_BLANKS;
 | |
|                 if (RAW != '[') {
 | |
|                     xmlFatalErr(ctxt, XML_ERR_CONDSEC_INVALID, NULL);
 | |
|                     xmlHaltParser(ctxt);
 | |
|                     goto error;
 | |
|                 }
 | |
|                 if (ctxt->input->id != id) {
 | |
|                     xmlFatalErrMsg(ctxt, XML_ERR_ENTITY_BOUNDARY,
 | |
|                                    "All markup of the conditional section is"
 | |
|                                    " not in the same entity\n");
 | |
|                 }
 | |
|                 NEXT;
 | |
| 
 | |
|                 if (inputIdsSize <= depth) {
 | |
|                     int *tmp;
 | |
| 
 | |
|                     inputIdsSize = (inputIdsSize == 0 ? 4 : inputIdsSize * 2);
 | |
|                     tmp = (int *) xmlRealloc(inputIds,
 | |
|                             inputIdsSize * sizeof(int));
 | |
|                     if (tmp == NULL) {
 | |
|                         xmlErrMemory(ctxt, NULL);
 | |
|                         goto error;
 | |
|                     }
 | |
|                     inputIds = tmp;
 | |
|                 }
 | |
|                 inputIds[depth] = id;
 | |
|                 depth++;
 | |
|             } else if (CMP6(CUR_PTR, 'I', 'G', 'N', 'O', 'R', 'E')) {
 | |
|                 size_t ignoreDepth = 0;
 | |
| 
 | |
|                 SKIP(6);
 | |
|                 SKIP_BLANKS;
 | |
|                 if (RAW != '[') {
 | |
|                     xmlFatalErr(ctxt, XML_ERR_CONDSEC_INVALID, NULL);
 | |
|                     xmlHaltParser(ctxt);
 | |
|                     goto error;
 | |
|                 }
 | |
|                 if (ctxt->input->id != id) {
 | |
|                     xmlFatalErrMsg(ctxt, XML_ERR_ENTITY_BOUNDARY,
 | |
|                                    "All markup of the conditional section is"
 | |
|                                    " not in the same entity\n");
 | |
|                 }
 | |
|                 NEXT;
 | |
| 
 | |
|                 while (RAW != 0) {
 | |
|                     if ((RAW == '<') && (NXT(1) == '!') && (NXT(2) == '[')) {
 | |
|                         SKIP(3);
 | |
|                         ignoreDepth++;
 | |
|                         /* Check for integer overflow */
 | |
|                         if (ignoreDepth == 0) {
 | |
|                             xmlErrMemory(ctxt, NULL);
 | |
|                             goto error;
 | |
|                         }
 | |
|                     } else if ((RAW == ']') && (NXT(1) == ']') &&
 | |
|                                (NXT(2) == '>')) {
 | |
|                         if (ignoreDepth == 0)
 | |
|                             break;
 | |
|                         SKIP(3);
 | |
|                         ignoreDepth--;
 | |
|                     } else {
 | |
|                         NEXT;
 | |
|                     }
 | |
|                 }
 | |
| 
 | |
| 		if (RAW == 0) {
 | |
| 		    xmlFatalErr(ctxt, XML_ERR_CONDSEC_NOT_FINISHED, NULL);
 | |
|                     goto error;
 | |
| 		}
 | |
|                 if (ctxt->input->id != id) {
 | |
|                     xmlFatalErrMsg(ctxt, XML_ERR_ENTITY_BOUNDARY,
 | |
|                                    "All markup of the conditional section is"
 | |
|                                    " not in the same entity\n");
 | |
|                 }
 | |
|                 SKIP(3);
 | |
|             } else {
 | |
|                 xmlFatalErr(ctxt, XML_ERR_CONDSEC_INVALID_KEYWORD, NULL);
 | |
|                 xmlHaltParser(ctxt);
 | |
|                 goto error;
 | |
|             }
 | |
|         } else if ((depth > 0) &&
 | |
|                    (RAW == ']') && (NXT(1) == ']') && (NXT(2) == '>')) {
 | |
|             depth--;
 | |
|             if (ctxt->input->id != inputIds[depth]) {
 | |
|                 xmlFatalErrMsg(ctxt, XML_ERR_ENTITY_BOUNDARY,
 | |
|                                "All markup of the conditional section is not"
 | |
|                                " in the same entity\n");
 | |
|             }
 | |
|             SKIP(3);
 | |
|         } else if ((RAW == '<') && ((NXT(1) == '!') || (NXT(1) == '?'))) {
 | |
|             xmlParseMarkupDecl(ctxt);
 | |
|         } else {
 | |
|             xmlFatalErr(ctxt, XML_ERR_EXT_SUBSET_NOT_FINISHED, NULL);
 | |
|             xmlHaltParser(ctxt);
 | |
|             goto error;
 | |
|         }
 | |
| 
 | |
|         if (depth == 0)
 | |
|             break;
 | |
| 
 | |
|         SKIP_BLANKS;
 | |
|         SHRINK;
 | |
|         GROW;
 | |
|     }
 | |
| 
 | |
| error:
 | |
|     xmlFree(inputIds);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseMarkupDecl:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * Parse markup declarations. Always consumes '<!' or '<?'.
 | |
|  *
 | |
|  * [29] markupdecl ::= elementdecl | AttlistDecl | EntityDecl |
 | |
|  *                     NotationDecl | PI | Comment
 | |
|  *
 | |
|  * [ VC: Proper Declaration/PE Nesting ]
 | |
|  * Parameter-entity replacement text must be properly nested with
 | |
|  * markup declarations. That is to say, if either the first character
 | |
|  * or the last character of a markup declaration (markupdecl above) is
 | |
|  * contained in the replacement text for a parameter-entity reference,
 | |
|  * both must be contained in the same replacement text.
 | |
|  *
 | |
|  * [ WFC: PEs in Internal Subset ]
 | |
|  * In the internal DTD subset, parameter-entity references can occur
 | |
|  * only where markup declarations can occur, not within markup declarations.
 | |
|  * (This does not apply to references that occur in external parameter
 | |
|  * entities or to the external subset.)
 | |
|  */
 | |
| void
 | |
| xmlParseMarkupDecl(xmlParserCtxtPtr ctxt) {
 | |
|     GROW;
 | |
|     if (CUR == '<') {
 | |
|         if (NXT(1) == '!') {
 | |
| 	    switch (NXT(2)) {
 | |
| 	        case 'E':
 | |
| 		    if (NXT(3) == 'L')
 | |
| 			xmlParseElementDecl(ctxt);
 | |
| 		    else if (NXT(3) == 'N')
 | |
| 			xmlParseEntityDecl(ctxt);
 | |
|                     else
 | |
|                         SKIP(2);
 | |
| 		    break;
 | |
| 	        case 'A':
 | |
| 		    xmlParseAttributeListDecl(ctxt);
 | |
| 		    break;
 | |
| 	        case 'N':
 | |
| 		    xmlParseNotationDecl(ctxt);
 | |
| 		    break;
 | |
| 	        case '-':
 | |
| 		    xmlParseComment(ctxt);
 | |
| 		    break;
 | |
| 		default:
 | |
| 		    /* there is an error but it will be detected later */
 | |
|                     SKIP(2);
 | |
| 		    break;
 | |
| 	    }
 | |
| 	} else if (NXT(1) == '?') {
 | |
| 	    xmlParsePI(ctxt);
 | |
| 	}
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * detect requirement to exit there and act accordingly
 | |
|      * and avoid having instate overridden later on
 | |
|      */
 | |
|     if (ctxt->instate == XML_PARSER_EOF)
 | |
|         return;
 | |
| 
 | |
|     ctxt->instate = XML_PARSER_DTD;
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseTextDecl:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * parse an XML declaration header for external entities
 | |
|  *
 | |
|  * [77] TextDecl ::= '<?xml' VersionInfo? EncodingDecl S? '?>'
 | |
|  */
 | |
| 
 | |
| void
 | |
| xmlParseTextDecl(xmlParserCtxtPtr ctxt) {
 | |
|     xmlChar *version;
 | |
|     int oldstate;
 | |
| 
 | |
|     /*
 | |
|      * We know that '<?xml' is here.
 | |
|      */
 | |
|     if ((CMP5(CUR_PTR, '<', '?', 'x', 'm', 'l')) && (IS_BLANK_CH(NXT(5)))) {
 | |
| 	SKIP(5);
 | |
|     } else {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_XMLDECL_NOT_STARTED, NULL);
 | |
| 	return;
 | |
|     }
 | |
| 
 | |
|     /* Avoid expansion of parameter entities when skipping blanks. */
 | |
|     oldstate = ctxt->instate;
 | |
|     ctxt->instate = XML_PARSER_START;
 | |
| 
 | |
|     if (SKIP_BLANKS == 0) {
 | |
| 	xmlFatalErrMsg(ctxt, XML_ERR_SPACE_REQUIRED,
 | |
| 		       "Space needed after '<?xml'\n");
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * We may have the VersionInfo here.
 | |
|      */
 | |
|     version = xmlParseVersionInfo(ctxt);
 | |
|     if (version == NULL)
 | |
| 	version = xmlCharStrdup(XML_DEFAULT_VERSION);
 | |
|     else {
 | |
| 	if (SKIP_BLANKS == 0) {
 | |
| 	    xmlFatalErrMsg(ctxt, XML_ERR_SPACE_REQUIRED,
 | |
| 		           "Space needed here\n");
 | |
| 	}
 | |
|     }
 | |
|     ctxt->input->version = version;
 | |
| 
 | |
|     /*
 | |
|      * We must have the encoding declaration
 | |
|      */
 | |
|     xmlParseEncodingDecl(ctxt);
 | |
|     if (ctxt->instate == XML_PARSER_EOF)
 | |
|         return;
 | |
|     if (ctxt->errNo == XML_ERR_UNSUPPORTED_ENCODING) {
 | |
| 	/*
 | |
| 	 * The XML REC instructs us to stop parsing right here
 | |
| 	 */
 | |
|         ctxt->instate = oldstate;
 | |
|         return;
 | |
|     }
 | |
| 
 | |
|     SKIP_BLANKS;
 | |
|     if ((RAW == '?') && (NXT(1) == '>')) {
 | |
|         SKIP(2);
 | |
|     } else if (RAW == '>') {
 | |
|         /* Deprecated old WD ... */
 | |
| 	xmlFatalErr(ctxt, XML_ERR_XMLDECL_NOT_FINISHED, NULL);
 | |
| 	NEXT;
 | |
|     } else {
 | |
|         int c;
 | |
| 
 | |
| 	xmlFatalErr(ctxt, XML_ERR_XMLDECL_NOT_FINISHED, NULL);
 | |
|         while ((c = CUR) != 0) {
 | |
|             NEXT;
 | |
|             if (c == '>')
 | |
|                 break;
 | |
|         }
 | |
|         if (ctxt->instate == XML_PARSER_EOF)
 | |
|             return;
 | |
|     }
 | |
| 
 | |
|     ctxt->instate = oldstate;
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseExternalSubset:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @ExternalID: the external identifier
 | |
|  * @SystemID: the system identifier (or URL)
 | |
|  *
 | |
|  * parse Markup declarations from an external subset
 | |
|  *
 | |
|  * [30] extSubset ::= textDecl? extSubsetDecl
 | |
|  *
 | |
|  * [31] extSubsetDecl ::= (markupdecl | conditionalSect | PEReference | S) *
 | |
|  */
 | |
| void
 | |
| xmlParseExternalSubset(xmlParserCtxtPtr ctxt, const xmlChar *ExternalID,
 | |
|                        const xmlChar *SystemID) {
 | |
|     xmlDetectSAX2(ctxt);
 | |
| 
 | |
|     xmlDetectEncoding(ctxt);
 | |
| 
 | |
|     if (CMP5(CUR_PTR, '<', '?', 'x', 'm', 'l')) {
 | |
| 	xmlParseTextDecl(ctxt);
 | |
| 	if (ctxt->errNo == XML_ERR_UNSUPPORTED_ENCODING) {
 | |
| 	    /*
 | |
| 	     * The XML REC instructs us to stop parsing right here
 | |
| 	     */
 | |
| 	    xmlHaltParser(ctxt);
 | |
| 	    return;
 | |
| 	}
 | |
|     }
 | |
|     if (ctxt->myDoc == NULL) {
 | |
|         ctxt->myDoc = xmlNewDoc(BAD_CAST "1.0");
 | |
| 	if (ctxt->myDoc == NULL) {
 | |
| 	    xmlErrMemory(ctxt, "New Doc failed");
 | |
| 	    return;
 | |
| 	}
 | |
| 	ctxt->myDoc->properties = XML_DOC_INTERNAL;
 | |
|     }
 | |
|     if ((ctxt->myDoc != NULL) && (ctxt->myDoc->intSubset == NULL))
 | |
|         xmlCreateIntSubset(ctxt->myDoc, NULL, ExternalID, SystemID);
 | |
| 
 | |
|     ctxt->instate = XML_PARSER_DTD;
 | |
|     ctxt->external = 1;
 | |
|     SKIP_BLANKS;
 | |
|     while ((ctxt->instate != XML_PARSER_EOF) && (RAW != 0)) {
 | |
| 	GROW;
 | |
|         if ((RAW == '<') && (NXT(1) == '!') && (NXT(2) == '[')) {
 | |
|             xmlParseConditionalSections(ctxt);
 | |
|         } else if ((RAW == '<') && ((NXT(1) == '!') || (NXT(1) == '?'))) {
 | |
|             xmlParseMarkupDecl(ctxt);
 | |
|         } else {
 | |
|             xmlFatalErr(ctxt, XML_ERR_EXT_SUBSET_NOT_FINISHED, NULL);
 | |
|             xmlHaltParser(ctxt);
 | |
|             return;
 | |
|         }
 | |
|         SKIP_BLANKS;
 | |
|         SHRINK;
 | |
|     }
 | |
| 
 | |
|     if (RAW != 0) {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_EXT_SUBSET_NOT_FINISHED, NULL);
 | |
|     }
 | |
| 
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseReference:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * parse and handle entity references in content, depending on the SAX
 | |
|  * interface, this may end-up in a call to character() if this is a
 | |
|  * CharRef, a predefined entity, if there is no reference() callback.
 | |
|  * or if the parser was asked to switch to that mode.
 | |
|  *
 | |
|  * Always consumes '&'.
 | |
|  *
 | |
|  * [67] Reference ::= EntityRef | CharRef
 | |
|  */
 | |
| void
 | |
| xmlParseReference(xmlParserCtxtPtr ctxt) {
 | |
|     xmlEntityPtr ent;
 | |
|     xmlChar *val;
 | |
|     int was_checked;
 | |
|     xmlNodePtr list = NULL;
 | |
|     xmlParserErrors ret = XML_ERR_OK;
 | |
| 
 | |
| 
 | |
|     if (RAW != '&')
 | |
|         return;
 | |
| 
 | |
|     /*
 | |
|      * Simple case of a CharRef
 | |
|      */
 | |
|     if (NXT(1) == '#') {
 | |
| 	int i = 0;
 | |
| 	xmlChar out[16];
 | |
| 	int value = xmlParseCharRef(ctxt);
 | |
| 
 | |
| 	if (value == 0)
 | |
| 	    return;
 | |
| 
 | |
|         /*
 | |
|          * Just encode the value in UTF-8
 | |
|          */
 | |
|         COPY_BUF(out, i, value);
 | |
|         out[i] = 0;
 | |
|         if ((ctxt->sax != NULL) && (ctxt->sax->characters != NULL) &&
 | |
|             (!ctxt->disableSAX))
 | |
|             ctxt->sax->characters(ctxt->userData, out, i);
 | |
| 	return;
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * We are seeing an entity reference
 | |
|      */
 | |
|     ent = xmlParseEntityRef(ctxt);
 | |
|     if (ent == NULL) return;
 | |
|     if (!ctxt->wellFormed)
 | |
| 	return;
 | |
|     was_checked = ent->flags & XML_ENT_PARSED;
 | |
| 
 | |
|     /* special case of predefined entities */
 | |
|     if ((ent->name == NULL) ||
 | |
|         (ent->etype == XML_INTERNAL_PREDEFINED_ENTITY)) {
 | |
| 	val = ent->content;
 | |
| 	if (val == NULL) return;
 | |
| 	/*
 | |
| 	 * inline the entity.
 | |
| 	 */
 | |
| 	if ((ctxt->sax != NULL) && (ctxt->sax->characters != NULL) &&
 | |
| 	    (!ctxt->disableSAX))
 | |
| 	    ctxt->sax->characters(ctxt->userData, val, xmlStrlen(val));
 | |
| 	return;
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * The first reference to the entity trigger a parsing phase
 | |
|      * where the ent->children is filled with the result from
 | |
|      * the parsing.
 | |
|      * Note: external parsed entities will not be loaded, it is not
 | |
|      * required for a non-validating parser, unless the parsing option
 | |
|      * of validating, or substituting entities were given. Doing so is
 | |
|      * far more secure as the parser will only process data coming from
 | |
|      * the document entity by default.
 | |
|      *
 | |
|      * FIXME: This doesn't work correctly since entities can be
 | |
|      * expanded with different namespace declarations in scope.
 | |
|      * For example:
 | |
|      *
 | |
|      * <!DOCTYPE doc [
 | |
|      *   <!ENTITY ent "<ns:elem/>">
 | |
|      * ]>
 | |
|      * <doc>
 | |
|      *   <decl1 xmlns:ns="urn:ns1">
 | |
|      *     &ent;
 | |
|      *   </decl1>
 | |
|      *   <decl2 xmlns:ns="urn:ns2">
 | |
|      *     &ent;
 | |
|      *   </decl2>
 | |
|      * </doc>
 | |
|      *
 | |
|      * Proposed fix:
 | |
|      *
 | |
|      * - Remove the ent->owner optimization which tries to avoid the
 | |
|      *   initial copy of the entity. Always make entities own the
 | |
|      *   subtree.
 | |
|      * - Ignore current namespace declarations when parsing the
 | |
|      *   entity. If a prefix can't be resolved, don't report an error
 | |
|      *   but mark it as unresolved.
 | |
|      * - Try to resolve these prefixes when expanding the entity.
 | |
|      *   This will require a specialized version of xmlStaticCopyNode
 | |
|      *   which can also make use of the namespace hash table to avoid
 | |
|      *   quadratic behavior.
 | |
|      *
 | |
|      * Alternatively, we could simply reparse the entity on each
 | |
|      * expansion like we already do with custom SAX callbacks.
 | |
|      * External entity content should be cached in this case.
 | |
|      */
 | |
|     if (((ent->flags & XML_ENT_PARSED) == 0) &&
 | |
|         ((ent->etype != XML_EXTERNAL_GENERAL_PARSED_ENTITY) ||
 | |
|          (ctxt->options & (XML_PARSE_NOENT | XML_PARSE_DTDVALID)))) {
 | |
| 	unsigned long oldsizeentcopy = ctxt->sizeentcopy;
 | |
| 
 | |
| 	/*
 | |
| 	 * This is a bit hackish but this seems the best
 | |
| 	 * way to make sure both SAX and DOM entity support
 | |
| 	 * behaves okay.
 | |
| 	 */
 | |
| 	void *user_data;
 | |
| 	if (ctxt->userData == ctxt)
 | |
| 	    user_data = NULL;
 | |
| 	else
 | |
| 	    user_data = ctxt->userData;
 | |
| 
 | |
|         /* Avoid overflow as much as possible */
 | |
|         ctxt->sizeentcopy = 0;
 | |
| 
 | |
|         if (ent->flags & XML_ENT_EXPANDING) {
 | |
|             xmlFatalErr(ctxt, XML_ERR_ENTITY_LOOP, NULL);
 | |
|             xmlHaltParser(ctxt);
 | |
|             return;
 | |
|         }
 | |
| 
 | |
|         ent->flags |= XML_ENT_EXPANDING;
 | |
| 
 | |
| 	/*
 | |
| 	 * Check that this entity is well formed
 | |
| 	 * 4.3.2: An internal general parsed entity is well-formed
 | |
| 	 * if its replacement text matches the production labeled
 | |
| 	 * content.
 | |
| 	 */
 | |
| 	if (ent->etype == XML_INTERNAL_GENERAL_ENTITY) {
 | |
| 	    ctxt->depth++;
 | |
| 	    ret = xmlParseBalancedChunkMemoryInternal(ctxt, ent->content,
 | |
| 	                                              user_data, &list);
 | |
| 	    ctxt->depth--;
 | |
| 
 | |
| 	} else if (ent->etype == XML_EXTERNAL_GENERAL_PARSED_ENTITY) {
 | |
| 	    ctxt->depth++;
 | |
| 	    ret = xmlParseExternalEntityPrivate(ctxt->myDoc, ctxt, ctxt->sax,
 | |
| 	                                   user_data, ctxt->depth, ent->URI,
 | |
| 					   ent->ExternalID, &list);
 | |
| 	    ctxt->depth--;
 | |
| 	} else {
 | |
| 	    ret = XML_ERR_ENTITY_PE_INTERNAL;
 | |
| 	    xmlErrMsgStr(ctxt, XML_ERR_INTERNAL_ERROR,
 | |
| 			 "invalid entity type found\n", NULL);
 | |
| 	}
 | |
| 
 | |
|         ent->flags &= ~XML_ENT_EXPANDING;
 | |
|         ent->flags |= XML_ENT_PARSED | XML_ENT_CHECKED;
 | |
|         ent->expandedSize = ctxt->sizeentcopy;
 | |
| 	if (ret == XML_ERR_ENTITY_LOOP) {
 | |
|             xmlHaltParser(ctxt);
 | |
| 	    xmlFreeNodeList(list);
 | |
| 	    return;
 | |
| 	}
 | |
| 	if (xmlParserEntityCheck(ctxt, oldsizeentcopy)) {
 | |
| 	    xmlFreeNodeList(list);
 | |
| 	    return;
 | |
| 	}
 | |
| 
 | |
| 	if ((ret == XML_ERR_OK) && (list != NULL)) {
 | |
|             ent->children = list;
 | |
|             /*
 | |
|              * Prune it directly in the generated document
 | |
|              * except for single text nodes.
 | |
|              */
 | |
|             if ((ctxt->replaceEntities == 0) ||
 | |
|                 (ctxt->parseMode == XML_PARSE_READER) ||
 | |
|                 ((list->type == XML_TEXT_NODE) &&
 | |
|                  (list->next == NULL))) {
 | |
|                 ent->owner = 1;
 | |
|                 while (list != NULL) {
 | |
|                     list->parent = (xmlNodePtr) ent;
 | |
|                     if (list->doc != ent->doc)
 | |
|                         xmlSetTreeDoc(list, ent->doc);
 | |
|                     if (list->next == NULL)
 | |
|                         ent->last = list;
 | |
|                     list = list->next;
 | |
|                 }
 | |
|                 list = NULL;
 | |
|             } else {
 | |
|                 ent->owner = 0;
 | |
|                 while (list != NULL) {
 | |
|                     list->parent = (xmlNodePtr) ctxt->node;
 | |
|                     list->doc = ctxt->myDoc;
 | |
|                     if (list->next == NULL)
 | |
|                         ent->last = list;
 | |
|                     list = list->next;
 | |
|                 }
 | |
|                 list = ent->children;
 | |
| #ifdef LIBXML_LEGACY_ENABLED
 | |
|                 if (ent->etype == XML_EXTERNAL_GENERAL_PARSED_ENTITY)
 | |
|                     xmlAddEntityReference(ent, list, NULL);
 | |
| #endif /* LIBXML_LEGACY_ENABLED */
 | |
|             }
 | |
| 	} else if ((ret != XML_ERR_OK) &&
 | |
| 		   (ret != XML_WAR_UNDECLARED_ENTITY)) {
 | |
| 	    xmlFatalErrMsgStr(ctxt, XML_ERR_UNDECLARED_ENTITY,
 | |
| 		     "Entity '%s' failed to parse\n", ent->name);
 | |
|             if (ent->content != NULL)
 | |
|                 ent->content[0] = 0;
 | |
| 	} else if (list != NULL) {
 | |
| 	    xmlFreeNodeList(list);
 | |
| 	    list = NULL;
 | |
| 	}
 | |
| 
 | |
|         /* Prevent entity from being parsed and expanded twice (Bug 760367). */
 | |
|         was_checked = 0;
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * Now that the entity content has been gathered
 | |
|      * provide it to the application, this can take different forms based
 | |
|      * on the parsing modes.
 | |
|      */
 | |
|     if (ent->children == NULL) {
 | |
| 	/*
 | |
| 	 * Probably running in SAX mode and the callbacks don't
 | |
| 	 * build the entity content. So unless we already went
 | |
| 	 * though parsing for first checking go though the entity
 | |
| 	 * content to generate callbacks associated to the entity
 | |
| 	 */
 | |
| 	if (was_checked != 0) {
 | |
| 	    void *user_data;
 | |
| 	    /*
 | |
| 	     * This is a bit hackish but this seems the best
 | |
| 	     * way to make sure both SAX and DOM entity support
 | |
| 	     * behaves okay.
 | |
| 	     */
 | |
| 	    if (ctxt->userData == ctxt)
 | |
| 		user_data = NULL;
 | |
| 	    else
 | |
| 		user_data = ctxt->userData;
 | |
| 
 | |
| 	    if (ent->etype == XML_INTERNAL_GENERAL_ENTITY) {
 | |
| 		ctxt->depth++;
 | |
| 		ret = xmlParseBalancedChunkMemoryInternal(ctxt,
 | |
| 				   ent->content, user_data, NULL);
 | |
| 		ctxt->depth--;
 | |
| 	    } else if (ent->etype ==
 | |
| 		       XML_EXTERNAL_GENERAL_PARSED_ENTITY) {
 | |
| 	        unsigned long oldsizeentities = ctxt->sizeentities;
 | |
| 
 | |
| 		ctxt->depth++;
 | |
| 		ret = xmlParseExternalEntityPrivate(ctxt->myDoc, ctxt,
 | |
| 			   ctxt->sax, user_data, ctxt->depth,
 | |
| 			   ent->URI, ent->ExternalID, NULL);
 | |
| 		ctxt->depth--;
 | |
| 
 | |
|                 /* Undo the change to sizeentities */
 | |
|                 ctxt->sizeentities = oldsizeentities;
 | |
| 	    } else {
 | |
| 		ret = XML_ERR_ENTITY_PE_INTERNAL;
 | |
| 		xmlErrMsgStr(ctxt, XML_ERR_INTERNAL_ERROR,
 | |
| 			     "invalid entity type found\n", NULL);
 | |
| 	    }
 | |
| 	    if (ret == XML_ERR_ENTITY_LOOP) {
 | |
| 		xmlFatalErr(ctxt, XML_ERR_ENTITY_LOOP, NULL);
 | |
| 		return;
 | |
| 	    }
 | |
|             if (xmlParserEntityCheck(ctxt, 0))
 | |
|                 return;
 | |
| 	}
 | |
| 	if ((ctxt->sax != NULL) && (ctxt->sax->reference != NULL) &&
 | |
| 	    (ctxt->replaceEntities == 0) && (!ctxt->disableSAX)) {
 | |
| 	    /*
 | |
| 	     * Entity reference callback comes second, it's somewhat
 | |
| 	     * superfluous but a compatibility to historical behaviour
 | |
| 	     */
 | |
| 	    ctxt->sax->reference(ctxt->userData, ent->name);
 | |
| 	}
 | |
| 	return;
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * We also check for amplification if entities aren't substituted.
 | |
|      * They might be expanded later.
 | |
|      */
 | |
|     if ((was_checked != 0) &&
 | |
|         (xmlParserEntityCheck(ctxt, ent->expandedSize)))
 | |
|         return;
 | |
| 
 | |
|     /*
 | |
|      * If we didn't get any children for the entity being built
 | |
|      */
 | |
|     if ((ctxt->sax != NULL) && (ctxt->sax->reference != NULL) &&
 | |
| 	(ctxt->replaceEntities == 0) && (!ctxt->disableSAX)) {
 | |
| 	/*
 | |
| 	 * Create a node.
 | |
| 	 */
 | |
| 	ctxt->sax->reference(ctxt->userData, ent->name);
 | |
| 	return;
 | |
|     }
 | |
| 
 | |
|     if (ctxt->replaceEntities)  {
 | |
| 	/*
 | |
| 	 * There is a problem on the handling of _private for entities
 | |
| 	 * (bug 155816): Should we copy the content of the field from
 | |
| 	 * the entity (possibly overwriting some value set by the user
 | |
| 	 * when a copy is created), should we leave it alone, or should
 | |
| 	 * we try to take care of different situations?  The problem
 | |
| 	 * is exacerbated by the usage of this field by the xmlReader.
 | |
| 	 * To fix this bug, we look at _private on the created node
 | |
| 	 * and, if it's NULL, we copy in whatever was in the entity.
 | |
| 	 * If it's not NULL we leave it alone.  This is somewhat of a
 | |
| 	 * hack - maybe we should have further tests to determine
 | |
| 	 * what to do.
 | |
| 	 */
 | |
| 	if (ctxt->node != NULL) {
 | |
| 	    /*
 | |
| 	     * Seems we are generating the DOM content, do
 | |
| 	     * a simple tree copy for all references except the first
 | |
| 	     * In the first occurrence list contains the replacement.
 | |
| 	     */
 | |
| 	    if (((list == NULL) && (ent->owner == 0)) ||
 | |
| 		(ctxt->parseMode == XML_PARSE_READER)) {
 | |
| 		xmlNodePtr nw = NULL, cur, firstChild = NULL;
 | |
| 
 | |
| 		/*
 | |
| 		 * when operating on a reader, the entities definitions
 | |
| 		 * are always owning the entities subtree.
 | |
| 		if (ctxt->parseMode == XML_PARSE_READER)
 | |
| 		    ent->owner = 1;
 | |
| 		 */
 | |
| 
 | |
| 		cur = ent->children;
 | |
| 		while (cur != NULL) {
 | |
| 		    nw = xmlDocCopyNode(cur, ctxt->myDoc, 1);
 | |
| 		    if (nw != NULL) {
 | |
| 			if (nw->_private == NULL)
 | |
| 			    nw->_private = cur->_private;
 | |
| 			if (firstChild == NULL){
 | |
| 			    firstChild = nw;
 | |
| 			}
 | |
| 			nw = xmlAddChild(ctxt->node, nw);
 | |
| 		    }
 | |
| 		    if (cur == ent->last) {
 | |
| 			/*
 | |
| 			 * needed to detect some strange empty
 | |
| 			 * node cases in the reader tests
 | |
| 			 */
 | |
| 			if ((ctxt->parseMode == XML_PARSE_READER) &&
 | |
| 			    (nw != NULL) &&
 | |
| 			    (nw->type == XML_ELEMENT_NODE) &&
 | |
| 			    (nw->children == NULL))
 | |
| 			    nw->extra = 1;
 | |
| 
 | |
| 			break;
 | |
| 		    }
 | |
| 		    cur = cur->next;
 | |
| 		}
 | |
| #ifdef LIBXML_LEGACY_ENABLED
 | |
| 		if (ent->etype == XML_EXTERNAL_GENERAL_PARSED_ENTITY)
 | |
| 		  xmlAddEntityReference(ent, firstChild, nw);
 | |
| #endif /* LIBXML_LEGACY_ENABLED */
 | |
| 	    } else if ((list == NULL) || (ctxt->inputNr > 0)) {
 | |
| 		xmlNodePtr nw = NULL, cur, next, last,
 | |
| 			   firstChild = NULL;
 | |
| 
 | |
| 		/*
 | |
| 		 * Copy the entity child list and make it the new
 | |
| 		 * entity child list. The goal is to make sure any
 | |
| 		 * ID or REF referenced will be the one from the
 | |
| 		 * document content and not the entity copy.
 | |
| 		 */
 | |
| 		cur = ent->children;
 | |
| 		ent->children = NULL;
 | |
| 		last = ent->last;
 | |
| 		ent->last = NULL;
 | |
| 		while (cur != NULL) {
 | |
| 		    next = cur->next;
 | |
| 		    cur->next = NULL;
 | |
| 		    cur->parent = NULL;
 | |
| 		    nw = xmlDocCopyNode(cur, ctxt->myDoc, 1);
 | |
| 		    if (nw != NULL) {
 | |
| 			if (nw->_private == NULL)
 | |
| 			    nw->_private = cur->_private;
 | |
| 			if (firstChild == NULL){
 | |
| 			    firstChild = cur;
 | |
| 			}
 | |
| 			xmlAddChild((xmlNodePtr) ent, nw);
 | |
| 		    }
 | |
| 		    xmlAddChild(ctxt->node, cur);
 | |
| 		    if (cur == last)
 | |
| 			break;
 | |
| 		    cur = next;
 | |
| 		}
 | |
| 		if (ent->owner == 0)
 | |
| 		    ent->owner = 1;
 | |
| #ifdef LIBXML_LEGACY_ENABLED
 | |
| 		if (ent->etype == XML_EXTERNAL_GENERAL_PARSED_ENTITY)
 | |
| 		  xmlAddEntityReference(ent, firstChild, nw);
 | |
| #endif /* LIBXML_LEGACY_ENABLED */
 | |
| 	    } else {
 | |
| 		const xmlChar *nbktext;
 | |
| 
 | |
| 		/*
 | |
| 		 * the name change is to avoid coalescing of the
 | |
| 		 * node with a possible previous text one which
 | |
| 		 * would make ent->children a dangling pointer
 | |
| 		 */
 | |
| 		nbktext = xmlDictLookup(ctxt->dict, BAD_CAST "nbktext",
 | |
| 					-1);
 | |
| 		if (ent->children->type == XML_TEXT_NODE)
 | |
| 		    ent->children->name = nbktext;
 | |
| 		if ((ent->last != ent->children) &&
 | |
| 		    (ent->last->type == XML_TEXT_NODE))
 | |
| 		    ent->last->name = nbktext;
 | |
| 		xmlAddChildList(ctxt->node, ent->children);
 | |
| 	    }
 | |
| 
 | |
| 	    /*
 | |
| 	     * This is to avoid a nasty side effect, see
 | |
| 	     * characters() in SAX.c
 | |
| 	     */
 | |
| 	    ctxt->nodemem = 0;
 | |
| 	    ctxt->nodelen = 0;
 | |
| 	    return;
 | |
| 	}
 | |
|     }
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseEntityRef:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * Parse an entitiy reference. Always consumes '&'.
 | |
|  *
 | |
|  * [68] EntityRef ::= '&' Name ';'
 | |
|  *
 | |
|  * [ WFC: Entity Declared ]
 | |
|  * In a document without any DTD, a document with only an internal DTD
 | |
|  * subset which contains no parameter entity references, or a document
 | |
|  * with "standalone='yes'", the Name given in the entity reference
 | |
|  * must match that in an entity declaration, except that well-formed
 | |
|  * documents need not declare any of the following entities: amp, lt,
 | |
|  * gt, apos, quot.  The declaration of a parameter entity must precede
 | |
|  * any reference to it.  Similarly, the declaration of a general entity
 | |
|  * must precede any reference to it which appears in a default value in an
 | |
|  * attribute-list declaration. Note that if entities are declared in the
 | |
|  * external subset or in external parameter entities, a non-validating
 | |
|  * processor is not obligated to read and process their declarations;
 | |
|  * for such documents, the rule that an entity must be declared is a
 | |
|  * well-formedness constraint only if standalone='yes'.
 | |
|  *
 | |
|  * [ WFC: Parsed Entity ]
 | |
|  * An entity reference must not contain the name of an unparsed entity
 | |
|  *
 | |
|  * Returns the xmlEntityPtr if found, or NULL otherwise.
 | |
|  */
 | |
| xmlEntityPtr
 | |
| xmlParseEntityRef(xmlParserCtxtPtr ctxt) {
 | |
|     const xmlChar *name;
 | |
|     xmlEntityPtr ent = NULL;
 | |
| 
 | |
|     GROW;
 | |
|     if (ctxt->instate == XML_PARSER_EOF)
 | |
|         return(NULL);
 | |
| 
 | |
|     if (RAW != '&')
 | |
|         return(NULL);
 | |
|     NEXT;
 | |
|     name = xmlParseName(ctxt);
 | |
|     if (name == NULL) {
 | |
| 	xmlFatalErrMsg(ctxt, XML_ERR_NAME_REQUIRED,
 | |
| 		       "xmlParseEntityRef: no name\n");
 | |
|         return(NULL);
 | |
|     }
 | |
|     if (RAW != ';') {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_ENTITYREF_SEMICOL_MISSING, NULL);
 | |
| 	return(NULL);
 | |
|     }
 | |
|     NEXT;
 | |
| 
 | |
|     /*
 | |
|      * Predefined entities override any extra definition
 | |
|      */
 | |
|     if ((ctxt->options & XML_PARSE_OLDSAX) == 0) {
 | |
|         ent = xmlGetPredefinedEntity(name);
 | |
|         if (ent != NULL)
 | |
|             return(ent);
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * Ask first SAX for entity resolution, otherwise try the
 | |
|      * entities which may have stored in the parser context.
 | |
|      */
 | |
|     if (ctxt->sax != NULL) {
 | |
| 	if (ctxt->sax->getEntity != NULL)
 | |
| 	    ent = ctxt->sax->getEntity(ctxt->userData, name);
 | |
| 	if ((ctxt->wellFormed == 1 ) && (ent == NULL) &&
 | |
| 	    (ctxt->options & XML_PARSE_OLDSAX))
 | |
| 	    ent = xmlGetPredefinedEntity(name);
 | |
| 	if ((ctxt->wellFormed == 1 ) && (ent == NULL) &&
 | |
| 	    (ctxt->userData==ctxt)) {
 | |
| 	    ent = xmlSAX2GetEntity(ctxt, name);
 | |
| 	}
 | |
|     }
 | |
|     if (ctxt->instate == XML_PARSER_EOF)
 | |
| 	return(NULL);
 | |
|     /*
 | |
|      * [ WFC: Entity Declared ]
 | |
|      * In a document without any DTD, a document with only an
 | |
|      * internal DTD subset which contains no parameter entity
 | |
|      * references, or a document with "standalone='yes'", the
 | |
|      * Name given in the entity reference must match that in an
 | |
|      * entity declaration, except that well-formed documents
 | |
|      * need not declare any of the following entities: amp, lt,
 | |
|      * gt, apos, quot.
 | |
|      * The declaration of a parameter entity must precede any
 | |
|      * reference to it.
 | |
|      * Similarly, the declaration of a general entity must
 | |
|      * precede any reference to it which appears in a default
 | |
|      * value in an attribute-list declaration. Note that if
 | |
|      * entities are declared in the external subset or in
 | |
|      * external parameter entities, a non-validating processor
 | |
|      * is not obligated to read and process their declarations;
 | |
|      * for such documents, the rule that an entity must be
 | |
|      * declared is a well-formedness constraint only if
 | |
|      * standalone='yes'.
 | |
|      */
 | |
|     if (ent == NULL) {
 | |
| 	if ((ctxt->standalone == 1) ||
 | |
| 	    ((ctxt->hasExternalSubset == 0) &&
 | |
| 	     (ctxt->hasPErefs == 0))) {
 | |
| 	    xmlFatalErrMsgStr(ctxt, XML_ERR_UNDECLARED_ENTITY,
 | |
| 		     "Entity '%s' not defined\n", name);
 | |
| 	} else {
 | |
| 	    xmlErrMsgStr(ctxt, XML_WAR_UNDECLARED_ENTITY,
 | |
| 		     "Entity '%s' not defined\n", name);
 | |
| 	    if ((ctxt->inSubset == 0) &&
 | |
| 		(ctxt->sax != NULL) &&
 | |
|                 (ctxt->disableSAX == 0) &&
 | |
| 		(ctxt->sax->reference != NULL)) {
 | |
| 		ctxt->sax->reference(ctxt->userData, name);
 | |
| 	    }
 | |
| 	}
 | |
| 	ctxt->valid = 0;
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * [ WFC: Parsed Entity ]
 | |
|      * An entity reference must not contain the name of an
 | |
|      * unparsed entity
 | |
|      */
 | |
|     else if (ent->etype == XML_EXTERNAL_GENERAL_UNPARSED_ENTITY) {
 | |
| 	xmlFatalErrMsgStr(ctxt, XML_ERR_UNPARSED_ENTITY,
 | |
| 		 "Entity reference to unparsed entity %s\n", name);
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * [ WFC: No External Entity References ]
 | |
|      * Attribute values cannot contain direct or indirect
 | |
|      * entity references to external entities.
 | |
|      */
 | |
|     else if ((ctxt->instate == XML_PARSER_ATTRIBUTE_VALUE) &&
 | |
| 	     (ent->etype == XML_EXTERNAL_GENERAL_PARSED_ENTITY)) {
 | |
| 	xmlFatalErrMsgStr(ctxt, XML_ERR_ENTITY_IS_EXTERNAL,
 | |
| 	     "Attribute references external entity '%s'\n", name);
 | |
|     }
 | |
|     /*
 | |
|      * [ WFC: No < in Attribute Values ]
 | |
|      * The replacement text of any entity referred to directly or
 | |
|      * indirectly in an attribute value (other than "<") must
 | |
|      * not contain a <.
 | |
|      */
 | |
|     else if ((ctxt->instate == XML_PARSER_ATTRIBUTE_VALUE) &&
 | |
| 	     (ent->etype != XML_INTERNAL_PREDEFINED_ENTITY)) {
 | |
| 	if ((ent->flags & XML_ENT_CHECKED_LT) == 0) {
 | |
|             if ((ent->content != NULL) && (xmlStrchr(ent->content, '<')))
 | |
|                 ent->flags |= XML_ENT_CONTAINS_LT;
 | |
|             ent->flags |= XML_ENT_CHECKED_LT;
 | |
|         }
 | |
|         if (ent->flags & XML_ENT_CONTAINS_LT)
 | |
|             xmlFatalErrMsgStr(ctxt, XML_ERR_LT_IN_ATTRIBUTE,
 | |
|                     "'<' in entity '%s' is not allowed in attributes "
 | |
|                     "values\n", name);
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * Internal check, no parameter entities here ...
 | |
|      */
 | |
|     else {
 | |
| 	switch (ent->etype) {
 | |
| 	    case XML_INTERNAL_PARAMETER_ENTITY:
 | |
| 	    case XML_EXTERNAL_PARAMETER_ENTITY:
 | |
| 	    xmlFatalErrMsgStr(ctxt, XML_ERR_ENTITY_IS_PARAMETER,
 | |
| 	     "Attempt to reference the parameter entity '%s'\n",
 | |
| 			      name);
 | |
| 	    break;
 | |
| 	    default:
 | |
| 	    break;
 | |
| 	}
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * [ WFC: No Recursion ]
 | |
|      * A parsed entity must not contain a recursive reference
 | |
|      * to itself, either directly or indirectly.
 | |
|      * Done somewhere else
 | |
|      */
 | |
|     return(ent);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseStringEntityRef:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @str:  a pointer to an index in the string
 | |
|  *
 | |
|  * parse ENTITY references declarations, but this version parses it from
 | |
|  * a string value.
 | |
|  *
 | |
|  * [68] EntityRef ::= '&' Name ';'
 | |
|  *
 | |
|  * [ WFC: Entity Declared ]
 | |
|  * In a document without any DTD, a document with only an internal DTD
 | |
|  * subset which contains no parameter entity references, or a document
 | |
|  * with "standalone='yes'", the Name given in the entity reference
 | |
|  * must match that in an entity declaration, except that well-formed
 | |
|  * documents need not declare any of the following entities: amp, lt,
 | |
|  * gt, apos, quot.  The declaration of a parameter entity must precede
 | |
|  * any reference to it.  Similarly, the declaration of a general entity
 | |
|  * must precede any reference to it which appears in a default value in an
 | |
|  * attribute-list declaration. Note that if entities are declared in the
 | |
|  * external subset or in external parameter entities, a non-validating
 | |
|  * processor is not obligated to read and process their declarations;
 | |
|  * for such documents, the rule that an entity must be declared is a
 | |
|  * well-formedness constraint only if standalone='yes'.
 | |
|  *
 | |
|  * [ WFC: Parsed Entity ]
 | |
|  * An entity reference must not contain the name of an unparsed entity
 | |
|  *
 | |
|  * Returns the xmlEntityPtr if found, or NULL otherwise. The str pointer
 | |
|  * is updated to the current location in the string.
 | |
|  */
 | |
| static xmlEntityPtr
 | |
| xmlParseStringEntityRef(xmlParserCtxtPtr ctxt, const xmlChar ** str) {
 | |
|     xmlChar *name;
 | |
|     const xmlChar *ptr;
 | |
|     xmlChar cur;
 | |
|     xmlEntityPtr ent = NULL;
 | |
| 
 | |
|     if ((str == NULL) || (*str == NULL))
 | |
|         return(NULL);
 | |
|     ptr = *str;
 | |
|     cur = *ptr;
 | |
|     if (cur != '&')
 | |
| 	return(NULL);
 | |
| 
 | |
|     ptr++;
 | |
|     name = xmlParseStringName(ctxt, &ptr);
 | |
|     if (name == NULL) {
 | |
| 	xmlFatalErrMsg(ctxt, XML_ERR_NAME_REQUIRED,
 | |
| 		       "xmlParseStringEntityRef: no name\n");
 | |
| 	*str = ptr;
 | |
| 	return(NULL);
 | |
|     }
 | |
|     if (*ptr != ';') {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_ENTITYREF_SEMICOL_MISSING, NULL);
 | |
|         xmlFree(name);
 | |
| 	*str = ptr;
 | |
| 	return(NULL);
 | |
|     }
 | |
|     ptr++;
 | |
| 
 | |
| 
 | |
|     /*
 | |
|      * Predefined entities override any extra definition
 | |
|      */
 | |
|     if ((ctxt->options & XML_PARSE_OLDSAX) == 0) {
 | |
|         ent = xmlGetPredefinedEntity(name);
 | |
|         if (ent != NULL) {
 | |
|             xmlFree(name);
 | |
|             *str = ptr;
 | |
|             return(ent);
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * Ask first SAX for entity resolution, otherwise try the
 | |
|      * entities which may have stored in the parser context.
 | |
|      */
 | |
|     if (ctxt->sax != NULL) {
 | |
| 	if (ctxt->sax->getEntity != NULL)
 | |
| 	    ent = ctxt->sax->getEntity(ctxt->userData, name);
 | |
| 	if ((ent == NULL) && (ctxt->options & XML_PARSE_OLDSAX))
 | |
| 	    ent = xmlGetPredefinedEntity(name);
 | |
| 	if ((ent == NULL) && (ctxt->userData==ctxt)) {
 | |
| 	    ent = xmlSAX2GetEntity(ctxt, name);
 | |
| 	}
 | |
|     }
 | |
|     if (ctxt->instate == XML_PARSER_EOF) {
 | |
| 	xmlFree(name);
 | |
| 	return(NULL);
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * [ WFC: Entity Declared ]
 | |
|      * In a document without any DTD, a document with only an
 | |
|      * internal DTD subset which contains no parameter entity
 | |
|      * references, or a document with "standalone='yes'", the
 | |
|      * Name given in the entity reference must match that in an
 | |
|      * entity declaration, except that well-formed documents
 | |
|      * need not declare any of the following entities: amp, lt,
 | |
|      * gt, apos, quot.
 | |
|      * The declaration of a parameter entity must precede any
 | |
|      * reference to it.
 | |
|      * Similarly, the declaration of a general entity must
 | |
|      * precede any reference to it which appears in a default
 | |
|      * value in an attribute-list declaration. Note that if
 | |
|      * entities are declared in the external subset or in
 | |
|      * external parameter entities, a non-validating processor
 | |
|      * is not obligated to read and process their declarations;
 | |
|      * for such documents, the rule that an entity must be
 | |
|      * declared is a well-formedness constraint only if
 | |
|      * standalone='yes'.
 | |
|      */
 | |
|     if (ent == NULL) {
 | |
| 	if ((ctxt->standalone == 1) ||
 | |
| 	    ((ctxt->hasExternalSubset == 0) &&
 | |
| 	     (ctxt->hasPErefs == 0))) {
 | |
| 	    xmlFatalErrMsgStr(ctxt, XML_ERR_UNDECLARED_ENTITY,
 | |
| 		     "Entity '%s' not defined\n", name);
 | |
| 	} else {
 | |
| 	    xmlErrMsgStr(ctxt, XML_WAR_UNDECLARED_ENTITY,
 | |
| 			  "Entity '%s' not defined\n",
 | |
| 			  name);
 | |
| 	}
 | |
| 	/* TODO ? check regressions ctxt->valid = 0; */
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * [ WFC: Parsed Entity ]
 | |
|      * An entity reference must not contain the name of an
 | |
|      * unparsed entity
 | |
|      */
 | |
|     else if (ent->etype == XML_EXTERNAL_GENERAL_UNPARSED_ENTITY) {
 | |
| 	xmlFatalErrMsgStr(ctxt, XML_ERR_UNPARSED_ENTITY,
 | |
| 		 "Entity reference to unparsed entity %s\n", name);
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * [ WFC: No External Entity References ]
 | |
|      * Attribute values cannot contain direct or indirect
 | |
|      * entity references to external entities.
 | |
|      */
 | |
|     else if ((ctxt->instate == XML_PARSER_ATTRIBUTE_VALUE) &&
 | |
| 	     (ent->etype == XML_EXTERNAL_GENERAL_PARSED_ENTITY)) {
 | |
| 	xmlFatalErrMsgStr(ctxt, XML_ERR_ENTITY_IS_EXTERNAL,
 | |
| 	 "Attribute references external entity '%s'\n", name);
 | |
|     }
 | |
|     /*
 | |
|      * [ WFC: No < in Attribute Values ]
 | |
|      * The replacement text of any entity referred to directly or
 | |
|      * indirectly in an attribute value (other than "<") must
 | |
|      * not contain a <.
 | |
|      */
 | |
|     else if ((ctxt->instate == XML_PARSER_ATTRIBUTE_VALUE) &&
 | |
| 	     (ent->etype != XML_INTERNAL_PREDEFINED_ENTITY)) {
 | |
| 	if ((ent->flags & XML_ENT_CHECKED_LT) == 0) {
 | |
|             if ((ent->content != NULL) && (xmlStrchr(ent->content, '<')))
 | |
|                 ent->flags |= XML_ENT_CONTAINS_LT;
 | |
|             ent->flags |= XML_ENT_CHECKED_LT;
 | |
|         }
 | |
|         if (ent->flags & XML_ENT_CONTAINS_LT)
 | |
|             xmlFatalErrMsgStr(ctxt, XML_ERR_LT_IN_ATTRIBUTE,
 | |
|                     "'<' in entity '%s' is not allowed in attributes "
 | |
|                     "values\n", name);
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * Internal check, no parameter entities here ...
 | |
|      */
 | |
|     else {
 | |
| 	switch (ent->etype) {
 | |
| 	    case XML_INTERNAL_PARAMETER_ENTITY:
 | |
| 	    case XML_EXTERNAL_PARAMETER_ENTITY:
 | |
| 		xmlFatalErrMsgStr(ctxt, XML_ERR_ENTITY_IS_PARAMETER,
 | |
| 	     "Attempt to reference the parameter entity '%s'\n",
 | |
| 				  name);
 | |
| 	    break;
 | |
| 	    default:
 | |
| 	    break;
 | |
| 	}
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * [ WFC: No Recursion ]
 | |
|      * A parsed entity must not contain a recursive reference
 | |
|      * to itself, either directly or indirectly.
 | |
|      * Done somewhere else
 | |
|      */
 | |
| 
 | |
|     xmlFree(name);
 | |
|     *str = ptr;
 | |
|     return(ent);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParsePEReference:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * Parse a parameter entity reference. Always consumes '%'.
 | |
|  *
 | |
|  * The entity content is handled directly by pushing it's content as
 | |
|  * a new input stream.
 | |
|  *
 | |
|  * [69] PEReference ::= '%' Name ';'
 | |
|  *
 | |
|  * [ WFC: No Recursion ]
 | |
|  * A parsed entity must not contain a recursive
 | |
|  * reference to itself, either directly or indirectly.
 | |
|  *
 | |
|  * [ WFC: Entity Declared ]
 | |
|  * In a document without any DTD, a document with only an internal DTD
 | |
|  * subset which contains no parameter entity references, or a document
 | |
|  * with "standalone='yes'", ...  ... The declaration of a parameter
 | |
|  * entity must precede any reference to it...
 | |
|  *
 | |
|  * [ VC: Entity Declared ]
 | |
|  * In a document with an external subset or external parameter entities
 | |
|  * with "standalone='no'", ...  ... The declaration of a parameter entity
 | |
|  * must precede any reference to it...
 | |
|  *
 | |
|  * [ WFC: In DTD ]
 | |
|  * Parameter-entity references may only appear in the DTD.
 | |
|  * NOTE: misleading but this is handled.
 | |
|  */
 | |
| void
 | |
| xmlParsePEReference(xmlParserCtxtPtr ctxt)
 | |
| {
 | |
|     const xmlChar *name;
 | |
|     xmlEntityPtr entity = NULL;
 | |
|     xmlParserInputPtr input;
 | |
| 
 | |
|     if (RAW != '%')
 | |
|         return;
 | |
|     NEXT;
 | |
|     name = xmlParseName(ctxt);
 | |
|     if (name == NULL) {
 | |
| 	xmlFatalErrMsg(ctxt, XML_ERR_PEREF_NO_NAME, "PEReference: no name\n");
 | |
| 	return;
 | |
|     }
 | |
|     if (xmlParserDebugEntities)
 | |
| 	xmlGenericError(xmlGenericErrorContext,
 | |
| 		"PEReference: %s\n", name);
 | |
|     if (RAW != ';') {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_PEREF_SEMICOL_MISSING, NULL);
 | |
|         return;
 | |
|     }
 | |
| 
 | |
|     NEXT;
 | |
| 
 | |
|     /*
 | |
|      * Request the entity from SAX
 | |
|      */
 | |
|     if ((ctxt->sax != NULL) &&
 | |
| 	(ctxt->sax->getParameterEntity != NULL))
 | |
| 	entity = ctxt->sax->getParameterEntity(ctxt->userData, name);
 | |
|     if (ctxt->instate == XML_PARSER_EOF)
 | |
| 	return;
 | |
|     if (entity == NULL) {
 | |
| 	/*
 | |
| 	 * [ WFC: Entity Declared ]
 | |
| 	 * In a document without any DTD, a document with only an
 | |
| 	 * internal DTD subset which contains no parameter entity
 | |
| 	 * references, or a document with "standalone='yes'", ...
 | |
| 	 * ... The declaration of a parameter entity must precede
 | |
| 	 * any reference to it...
 | |
| 	 */
 | |
| 	if ((ctxt->standalone == 1) ||
 | |
| 	    ((ctxt->hasExternalSubset == 0) &&
 | |
| 	     (ctxt->hasPErefs == 0))) {
 | |
| 	    xmlFatalErrMsgStr(ctxt, XML_ERR_UNDECLARED_ENTITY,
 | |
| 			      "PEReference: %%%s; not found\n",
 | |
| 			      name);
 | |
| 	} else {
 | |
| 	    /*
 | |
| 	     * [ VC: Entity Declared ]
 | |
| 	     * In a document with an external subset or external
 | |
| 	     * parameter entities with "standalone='no'", ...
 | |
| 	     * ... The declaration of a parameter entity must
 | |
| 	     * precede any reference to it...
 | |
| 	     */
 | |
|             if ((ctxt->validate) && (ctxt->vctxt.error != NULL)) {
 | |
|                 xmlValidityError(ctxt, XML_WAR_UNDECLARED_ENTITY,
 | |
|                                  "PEReference: %%%s; not found\n",
 | |
|                                  name, NULL);
 | |
|             } else
 | |
|                 xmlWarningMsg(ctxt, XML_WAR_UNDECLARED_ENTITY,
 | |
|                               "PEReference: %%%s; not found\n",
 | |
|                               name, NULL);
 | |
|             ctxt->valid = 0;
 | |
| 	}
 | |
|     } else {
 | |
| 	/*
 | |
| 	 * Internal checking in case the entity quest barfed
 | |
| 	 */
 | |
| 	if ((entity->etype != XML_INTERNAL_PARAMETER_ENTITY) &&
 | |
| 	    (entity->etype != XML_EXTERNAL_PARAMETER_ENTITY)) {
 | |
| 	    xmlWarningMsg(ctxt, XML_WAR_UNDECLARED_ENTITY,
 | |
| 		  "Internal: %%%s; is not a parameter entity\n",
 | |
| 			  name, NULL);
 | |
| 	} else {
 | |
|             unsigned long parentConsumed;
 | |
|             xmlEntityPtr oldEnt;
 | |
| 
 | |
| 	    if ((entity->etype == XML_EXTERNAL_PARAMETER_ENTITY) &&
 | |
| 	        ((ctxt->options & XML_PARSE_NOENT) == 0) &&
 | |
| 		((ctxt->options & XML_PARSE_DTDVALID) == 0) &&
 | |
| 		((ctxt->options & XML_PARSE_DTDLOAD) == 0) &&
 | |
| 		((ctxt->options & XML_PARSE_DTDATTR) == 0) &&
 | |
| 		(ctxt->replaceEntities == 0) &&
 | |
| 		(ctxt->validate == 0))
 | |
| 		return;
 | |
| 
 | |
|             if (entity->flags & XML_ENT_EXPANDING) {
 | |
|                 xmlFatalErr(ctxt, XML_ERR_ENTITY_LOOP, NULL);
 | |
|                 xmlHaltParser(ctxt);
 | |
|                 return;
 | |
|             }
 | |
| 
 | |
|             /* Must be computed from old input before pushing new input. */
 | |
|             parentConsumed = ctxt->input->parentConsumed;
 | |
|             oldEnt = ctxt->input->entity;
 | |
|             if ((oldEnt == NULL) ||
 | |
|                 ((oldEnt->etype == XML_EXTERNAL_PARAMETER_ENTITY) &&
 | |
|                  ((oldEnt->flags & XML_ENT_PARSED) == 0))) {
 | |
|                 xmlSaturatedAdd(&parentConsumed, ctxt->input->consumed);
 | |
|                 xmlSaturatedAddSizeT(&parentConsumed,
 | |
|                                      ctxt->input->cur - ctxt->input->base);
 | |
|             }
 | |
| 
 | |
| 	    input = xmlNewEntityInputStream(ctxt, entity);
 | |
| 	    if (xmlPushInput(ctxt, input) < 0) {
 | |
|                 xmlFreeInputStream(input);
 | |
| 		return;
 | |
|             }
 | |
| 
 | |
|             entity->flags |= XML_ENT_EXPANDING;
 | |
| 
 | |
|             input->parentConsumed = parentConsumed;
 | |
| 
 | |
| 	    if (entity->etype == XML_EXTERNAL_PARAMETER_ENTITY) {
 | |
|                 xmlDetectEncoding(ctxt);
 | |
| 
 | |
|                 if ((CMP5(CUR_PTR, '<', '?', 'x', 'm', 'l')) &&
 | |
|                     (IS_BLANK_CH(NXT(5)))) {
 | |
|                     xmlParseTextDecl(ctxt);
 | |
|                 }
 | |
|             }
 | |
| 	}
 | |
|     }
 | |
|     ctxt->hasPErefs = 1;
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlLoadEntityContent:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @entity: an unloaded system entity
 | |
|  *
 | |
|  * Load the original content of the given system entity from the
 | |
|  * ExternalID/SystemID given. This is to be used for Included in Literal
 | |
|  * http://www.w3.org/TR/REC-xml/#inliteral processing of entities references
 | |
|  *
 | |
|  * Returns 0 in case of success and -1 in case of failure
 | |
|  */
 | |
| static int
 | |
| xmlLoadEntityContent(xmlParserCtxtPtr ctxt, xmlEntityPtr entity) {
 | |
|     xmlParserInputPtr oldinput, input = NULL;
 | |
|     xmlParserInputPtr *oldinputTab;
 | |
|     const xmlChar *oldencoding;
 | |
|     xmlChar *content = NULL;
 | |
|     size_t length, i;
 | |
|     int oldinputNr, oldinputMax, oldprogressive;
 | |
|     int ret = -1;
 | |
|     int res;
 | |
| 
 | |
|     if ((ctxt == NULL) || (entity == NULL) ||
 | |
|         ((entity->etype != XML_EXTERNAL_PARAMETER_ENTITY) &&
 | |
| 	 (entity->etype != XML_EXTERNAL_GENERAL_PARSED_ENTITY)) ||
 | |
| 	(entity->content != NULL)) {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_INTERNAL_ERROR,
 | |
| 	            "xmlLoadEntityContent parameter error");
 | |
|         return(-1);
 | |
|     }
 | |
| 
 | |
|     if (xmlParserDebugEntities)
 | |
| 	xmlGenericError(xmlGenericErrorContext,
 | |
| 		"Reading %s entity content input\n", entity->name);
 | |
| 
 | |
|     input = xmlLoadExternalEntity((char *) entity->URI,
 | |
|            (char *) entity->ExternalID, ctxt);
 | |
|     if (input == NULL) {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_INTERNAL_ERROR,
 | |
| 	            "xmlLoadEntityContent input error");
 | |
|         return(-1);
 | |
|     }
 | |
| 
 | |
|     oldinput = ctxt->input;
 | |
|     oldinputNr = ctxt->inputNr;
 | |
|     oldinputMax = ctxt->inputMax;
 | |
|     oldinputTab = ctxt->inputTab;
 | |
|     oldencoding = ctxt->encoding;
 | |
|     oldprogressive = ctxt->progressive;
 | |
| 
 | |
|     ctxt->input = NULL;
 | |
|     ctxt->inputNr = 0;
 | |
|     ctxt->inputMax = 1;
 | |
|     ctxt->encoding = NULL;
 | |
|     ctxt->progressive = 0;
 | |
|     ctxt->inputTab = xmlMalloc(sizeof(xmlParserInputPtr));
 | |
|     if (ctxt->inputTab == NULL) {
 | |
|         xmlErrMemory(ctxt, NULL);
 | |
|         xmlFreeInputStream(input);
 | |
|         goto error;
 | |
|     }
 | |
| 
 | |
|     xmlBufResetInput(input->buf->buffer, input);
 | |
| 
 | |
|     inputPush(ctxt, input);
 | |
| 
 | |
|     xmlDetectEncoding(ctxt);
 | |
| 
 | |
|     /*
 | |
|      * Parse a possible text declaration first
 | |
|      */
 | |
|     if ((CMP5(CUR_PTR, '<', '?', 'x', 'm', 'l')) && (IS_BLANK_CH(NXT(5)))) {
 | |
| 	xmlParseTextDecl(ctxt);
 | |
|         /*
 | |
|          * An XML-1.0 document can't reference an entity not XML-1.0
 | |
|          */
 | |
|         if ((xmlStrEqual(ctxt->version, BAD_CAST "1.0")) &&
 | |
|             (!xmlStrEqual(ctxt->input->version, BAD_CAST "1.0"))) {
 | |
|             xmlFatalErrMsg(ctxt, XML_ERR_VERSION_MISMATCH,
 | |
|                            "Version mismatch between document and entity\n");
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     if (ctxt->instate == XML_PARSER_EOF)
 | |
|         goto error;
 | |
| 
 | |
|     length = input->cur - input->base;
 | |
|     xmlBufShrink(input->buf->buffer, length);
 | |
|     xmlSaturatedAdd(&ctxt->sizeentities, length);
 | |
| 
 | |
|     while ((res = xmlParserInputBufferGrow(input->buf, 4096)) > 0)
 | |
|         ;
 | |
| 
 | |
|     xmlBufResetInput(input->buf->buffer, input);
 | |
| 
 | |
|     if (res < 0) {
 | |
|         xmlFatalErr(ctxt, input->buf->error, NULL);
 | |
|         goto error;
 | |
|     }
 | |
| 
 | |
|     length = xmlBufUse(input->buf->buffer);
 | |
|     content = xmlBufDetach(input->buf->buffer);
 | |
| 
 | |
|     if (length > INT_MAX) {
 | |
|         xmlErrMemory(ctxt, NULL);
 | |
|         goto error;
 | |
|     }
 | |
| 
 | |
|     for (i = 0; i < length; ) {
 | |
|         int clen = length - i;
 | |
|         int c = xmlGetUTF8Char(content + i, &clen);
 | |
| 
 | |
|         if ((c < 0) || (!IS_CHAR(c))) {
 | |
|             xmlFatalErrMsgInt(ctxt, XML_ERR_INVALID_CHAR,
 | |
|                               "xmlLoadEntityContent: invalid char value %d\n",
 | |
|                               content[i]);
 | |
|             goto error;
 | |
|         }
 | |
|         i += clen;
 | |
|     }
 | |
| 
 | |
|     xmlSaturatedAdd(&ctxt->sizeentities, length);
 | |
|     entity->content = content;
 | |
|     entity->length = length;
 | |
|     content = NULL;
 | |
|     ret = 0;
 | |
| 
 | |
| error:
 | |
|     while (ctxt->inputNr > 0)
 | |
|         xmlFreeInputStream(inputPop(ctxt));
 | |
|     xmlFree(ctxt->inputTab);
 | |
|     xmlFree((xmlChar *) ctxt->encoding);
 | |
| 
 | |
|     ctxt->input = oldinput;
 | |
|     ctxt->inputNr = oldinputNr;
 | |
|     ctxt->inputMax = oldinputMax;
 | |
|     ctxt->inputTab = oldinputTab;
 | |
|     ctxt->encoding = oldencoding;
 | |
|     ctxt->progressive = oldprogressive;
 | |
| 
 | |
|     xmlFree(content);
 | |
| 
 | |
|     return(ret);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseStringPEReference:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @str:  a pointer to an index in the string
 | |
|  *
 | |
|  * parse PEReference declarations
 | |
|  *
 | |
|  * [69] PEReference ::= '%' Name ';'
 | |
|  *
 | |
|  * [ WFC: No Recursion ]
 | |
|  * A parsed entity must not contain a recursive
 | |
|  * reference to itself, either directly or indirectly.
 | |
|  *
 | |
|  * [ WFC: Entity Declared ]
 | |
|  * In a document without any DTD, a document with only an internal DTD
 | |
|  * subset which contains no parameter entity references, or a document
 | |
|  * with "standalone='yes'", ...  ... The declaration of a parameter
 | |
|  * entity must precede any reference to it...
 | |
|  *
 | |
|  * [ VC: Entity Declared ]
 | |
|  * In a document with an external subset or external parameter entities
 | |
|  * with "standalone='no'", ...  ... The declaration of a parameter entity
 | |
|  * must precede any reference to it...
 | |
|  *
 | |
|  * [ WFC: In DTD ]
 | |
|  * Parameter-entity references may only appear in the DTD.
 | |
|  * NOTE: misleading but this is handled.
 | |
|  *
 | |
|  * Returns the string of the entity content.
 | |
|  *         str is updated to the current value of the index
 | |
|  */
 | |
| static xmlEntityPtr
 | |
| xmlParseStringPEReference(xmlParserCtxtPtr ctxt, const xmlChar **str) {
 | |
|     const xmlChar *ptr;
 | |
|     xmlChar cur;
 | |
|     xmlChar *name;
 | |
|     xmlEntityPtr entity = NULL;
 | |
| 
 | |
|     if ((str == NULL) || (*str == NULL)) return(NULL);
 | |
|     ptr = *str;
 | |
|     cur = *ptr;
 | |
|     if (cur != '%')
 | |
|         return(NULL);
 | |
|     ptr++;
 | |
|     name = xmlParseStringName(ctxt, &ptr);
 | |
|     if (name == NULL) {
 | |
| 	xmlFatalErrMsg(ctxt, XML_ERR_NAME_REQUIRED,
 | |
| 		       "xmlParseStringPEReference: no name\n");
 | |
| 	*str = ptr;
 | |
| 	return(NULL);
 | |
|     }
 | |
|     cur = *ptr;
 | |
|     if (cur != ';') {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_ENTITYREF_SEMICOL_MISSING, NULL);
 | |
| 	xmlFree(name);
 | |
| 	*str = ptr;
 | |
| 	return(NULL);
 | |
|     }
 | |
|     ptr++;
 | |
| 
 | |
|     /*
 | |
|      * Request the entity from SAX
 | |
|      */
 | |
|     if ((ctxt->sax != NULL) &&
 | |
| 	(ctxt->sax->getParameterEntity != NULL))
 | |
| 	entity = ctxt->sax->getParameterEntity(ctxt->userData, name);
 | |
|     if (ctxt->instate == XML_PARSER_EOF) {
 | |
| 	xmlFree(name);
 | |
| 	*str = ptr;
 | |
| 	return(NULL);
 | |
|     }
 | |
|     if (entity == NULL) {
 | |
| 	/*
 | |
| 	 * [ WFC: Entity Declared ]
 | |
| 	 * In a document without any DTD, a document with only an
 | |
| 	 * internal DTD subset which contains no parameter entity
 | |
| 	 * references, or a document with "standalone='yes'", ...
 | |
| 	 * ... The declaration of a parameter entity must precede
 | |
| 	 * any reference to it...
 | |
| 	 */
 | |
| 	if ((ctxt->standalone == 1) ||
 | |
| 	    ((ctxt->hasExternalSubset == 0) && (ctxt->hasPErefs == 0))) {
 | |
| 	    xmlFatalErrMsgStr(ctxt, XML_ERR_UNDECLARED_ENTITY,
 | |
| 		 "PEReference: %%%s; not found\n", name);
 | |
| 	} else {
 | |
| 	    /*
 | |
| 	     * [ VC: Entity Declared ]
 | |
| 	     * In a document with an external subset or external
 | |
| 	     * parameter entities with "standalone='no'", ...
 | |
| 	     * ... The declaration of a parameter entity must
 | |
| 	     * precede any reference to it...
 | |
| 	     */
 | |
| 	    xmlWarningMsg(ctxt, XML_WAR_UNDECLARED_ENTITY,
 | |
| 			  "PEReference: %%%s; not found\n",
 | |
| 			  name, NULL);
 | |
| 	    ctxt->valid = 0;
 | |
| 	}
 | |
|     } else {
 | |
| 	/*
 | |
| 	 * Internal checking in case the entity quest barfed
 | |
| 	 */
 | |
| 	if ((entity->etype != XML_INTERNAL_PARAMETER_ENTITY) &&
 | |
| 	    (entity->etype != XML_EXTERNAL_PARAMETER_ENTITY)) {
 | |
| 	    xmlWarningMsg(ctxt, XML_WAR_UNDECLARED_ENTITY,
 | |
| 			  "%%%s; is not a parameter entity\n",
 | |
| 			  name, NULL);
 | |
| 	}
 | |
|     }
 | |
|     ctxt->hasPErefs = 1;
 | |
|     xmlFree(name);
 | |
|     *str = ptr;
 | |
|     return(entity);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseDocTypeDecl:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * parse a DOCTYPE declaration
 | |
|  *
 | |
|  * [28] doctypedecl ::= '<!DOCTYPE' S Name (S ExternalID)? S?
 | |
|  *                      ('[' (markupdecl | PEReference | S)* ']' S?)? '>'
 | |
|  *
 | |
|  * [ VC: Root Element Type ]
 | |
|  * The Name in the document type declaration must match the element
 | |
|  * type of the root element.
 | |
|  */
 | |
| 
 | |
| void
 | |
| xmlParseDocTypeDecl(xmlParserCtxtPtr ctxt) {
 | |
|     const xmlChar *name = NULL;
 | |
|     xmlChar *ExternalID = NULL;
 | |
|     xmlChar *URI = NULL;
 | |
| 
 | |
|     /*
 | |
|      * We know that '<!DOCTYPE' has been detected.
 | |
|      */
 | |
|     SKIP(9);
 | |
| 
 | |
|     SKIP_BLANKS;
 | |
| 
 | |
|     /*
 | |
|      * Parse the DOCTYPE name.
 | |
|      */
 | |
|     name = xmlParseName(ctxt);
 | |
|     if (name == NULL) {
 | |
| 	xmlFatalErrMsg(ctxt, XML_ERR_NAME_REQUIRED,
 | |
| 		       "xmlParseDocTypeDecl : no DOCTYPE name !\n");
 | |
|     }
 | |
|     ctxt->intSubName = name;
 | |
| 
 | |
|     SKIP_BLANKS;
 | |
| 
 | |
|     /*
 | |
|      * Check for SystemID and ExternalID
 | |
|      */
 | |
|     URI = xmlParseExternalID(ctxt, &ExternalID, 1);
 | |
| 
 | |
|     if ((URI != NULL) || (ExternalID != NULL)) {
 | |
|         ctxt->hasExternalSubset = 1;
 | |
|     }
 | |
|     ctxt->extSubURI = URI;
 | |
|     ctxt->extSubSystem = ExternalID;
 | |
| 
 | |
|     SKIP_BLANKS;
 | |
| 
 | |
|     /*
 | |
|      * Create and update the internal subset.
 | |
|      */
 | |
|     if ((ctxt->sax != NULL) && (ctxt->sax->internalSubset != NULL) &&
 | |
| 	(!ctxt->disableSAX))
 | |
| 	ctxt->sax->internalSubset(ctxt->userData, name, ExternalID, URI);
 | |
|     if (ctxt->instate == XML_PARSER_EOF)
 | |
| 	return;
 | |
| 
 | |
|     /*
 | |
|      * Is there any internal subset declarations ?
 | |
|      * they are handled separately in xmlParseInternalSubset()
 | |
|      */
 | |
|     if (RAW == '[')
 | |
| 	return;
 | |
| 
 | |
|     /*
 | |
|      * We should be at the end of the DOCTYPE declaration.
 | |
|      */
 | |
|     if (RAW != '>') {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_DOCTYPE_NOT_FINISHED, NULL);
 | |
|     }
 | |
|     NEXT;
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseInternalSubset:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * parse the internal subset declaration
 | |
|  *
 | |
|  * [28 end] ('[' (markupdecl | PEReference | S)* ']' S?)? '>'
 | |
|  */
 | |
| 
 | |
| static void
 | |
| xmlParseInternalSubset(xmlParserCtxtPtr ctxt) {
 | |
|     /*
 | |
|      * Is there any DTD definition ?
 | |
|      */
 | |
|     if (RAW == '[') {
 | |
|         int baseInputNr = ctxt->inputNr;
 | |
|         ctxt->instate = XML_PARSER_DTD;
 | |
|         NEXT;
 | |
| 	/*
 | |
| 	 * Parse the succession of Markup declarations and
 | |
| 	 * PEReferences.
 | |
| 	 * Subsequence (markupdecl | PEReference | S)*
 | |
| 	 */
 | |
| 	SKIP_BLANKS;
 | |
| 	while (((RAW != ']') || (ctxt->inputNr > baseInputNr)) &&
 | |
|                (ctxt->instate != XML_PARSER_EOF)) {
 | |
| 
 | |
|             /*
 | |
|              * Conditional sections are allowed from external entities included
 | |
|              * by PE References in the internal subset.
 | |
|              */
 | |
|             if ((ctxt->inputNr > 1) && (ctxt->input->filename != NULL) &&
 | |
|                 (RAW == '<') && (NXT(1) == '!') && (NXT(2) == '[')) {
 | |
|                 xmlParseConditionalSections(ctxt);
 | |
|             } else if ((RAW == '<') && ((NXT(1) == '!') || (NXT(1) == '?'))) {
 | |
| 	        xmlParseMarkupDecl(ctxt);
 | |
|             } else if (RAW == '%') {
 | |
| 	        xmlParsePEReference(ctxt);
 | |
|             } else {
 | |
| 		xmlFatalErr(ctxt, XML_ERR_INTERNAL_ERROR,
 | |
|                         "xmlParseInternalSubset: error detected in"
 | |
|                         " Markup declaration\n");
 | |
|                 xmlHaltParser(ctxt);
 | |
|                 return;
 | |
|             }
 | |
| 	    SKIP_BLANKS;
 | |
|             SHRINK;
 | |
|             GROW;
 | |
| 	}
 | |
| 	if (RAW == ']') {
 | |
| 	    NEXT;
 | |
| 	    SKIP_BLANKS;
 | |
| 	}
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * We should be at the end of the DOCTYPE declaration.
 | |
|      */
 | |
|     if (RAW != '>') {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_DOCTYPE_NOT_FINISHED, NULL);
 | |
| 	return;
 | |
|     }
 | |
|     NEXT;
 | |
| }
 | |
| 
 | |
| #ifdef LIBXML_SAX1_ENABLED
 | |
| /**
 | |
|  * xmlParseAttribute:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @value:  a xmlChar ** used to store the value of the attribute
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * parse an attribute
 | |
|  *
 | |
|  * [41] Attribute ::= Name Eq AttValue
 | |
|  *
 | |
|  * [ WFC: No External Entity References ]
 | |
|  * Attribute values cannot contain direct or indirect entity references
 | |
|  * to external entities.
 | |
|  *
 | |
|  * [ WFC: No < in Attribute Values ]
 | |
|  * The replacement text of any entity referred to directly or indirectly in
 | |
|  * an attribute value (other than "<") must not contain a <.
 | |
|  *
 | |
|  * [ VC: Attribute Value Type ]
 | |
|  * The attribute must have been declared; the value must be of the type
 | |
|  * declared for it.
 | |
|  *
 | |
|  * [25] Eq ::= S? '=' S?
 | |
|  *
 | |
|  * With namespace:
 | |
|  *
 | |
|  * [NS 11] Attribute ::= QName Eq AttValue
 | |
|  *
 | |
|  * Also the case QName == xmlns:??? is handled independently as a namespace
 | |
|  * definition.
 | |
|  *
 | |
|  * Returns the attribute name, and the value in *value.
 | |
|  */
 | |
| 
 | |
| const xmlChar *
 | |
| xmlParseAttribute(xmlParserCtxtPtr ctxt, xmlChar **value) {
 | |
|     const xmlChar *name;
 | |
|     xmlChar *val;
 | |
| 
 | |
|     *value = NULL;
 | |
|     GROW;
 | |
|     name = xmlParseName(ctxt);
 | |
|     if (name == NULL) {
 | |
| 	xmlFatalErrMsg(ctxt, XML_ERR_NAME_REQUIRED,
 | |
| 	               "error parsing attribute name\n");
 | |
|         return(NULL);
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * read the value
 | |
|      */
 | |
|     SKIP_BLANKS;
 | |
|     if (RAW == '=') {
 | |
|         NEXT;
 | |
| 	SKIP_BLANKS;
 | |
| 	val = xmlParseAttValue(ctxt);
 | |
| 	ctxt->instate = XML_PARSER_CONTENT;
 | |
|     } else {
 | |
| 	xmlFatalErrMsgStr(ctxt, XML_ERR_ATTRIBUTE_WITHOUT_VALUE,
 | |
| 	       "Specification mandates value for attribute %s\n", name);
 | |
| 	return(name);
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * Check that xml:lang conforms to the specification
 | |
|      * No more registered as an error, just generate a warning now
 | |
|      * since this was deprecated in XML second edition
 | |
|      */
 | |
|     if ((ctxt->pedantic) && (xmlStrEqual(name, BAD_CAST "xml:lang"))) {
 | |
| 	if (!xmlCheckLanguageID(val)) {
 | |
| 	    xmlWarningMsg(ctxt, XML_WAR_LANG_VALUE,
 | |
| 		          "Malformed value for xml:lang : %s\n",
 | |
| 			  val, NULL);
 | |
| 	}
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * Check that xml:space conforms to the specification
 | |
|      */
 | |
|     if (xmlStrEqual(name, BAD_CAST "xml:space")) {
 | |
| 	if (xmlStrEqual(val, BAD_CAST "default"))
 | |
| 	    *(ctxt->space) = 0;
 | |
| 	else if (xmlStrEqual(val, BAD_CAST "preserve"))
 | |
| 	    *(ctxt->space) = 1;
 | |
| 	else {
 | |
| 		xmlWarningMsg(ctxt, XML_WAR_SPACE_VALUE,
 | |
| "Invalid value \"%s\" for xml:space : \"default\" or \"preserve\" expected\n",
 | |
|                                  val, NULL);
 | |
| 	}
 | |
|     }
 | |
| 
 | |
|     *value = val;
 | |
|     return(name);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseStartTag:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * Parse a start tag. Always consumes '<'.
 | |
|  *
 | |
|  * [40] STag ::= '<' Name (S Attribute)* S? '>'
 | |
|  *
 | |
|  * [ WFC: Unique Att Spec ]
 | |
|  * No attribute name may appear more than once in the same start-tag or
 | |
|  * empty-element tag.
 | |
|  *
 | |
|  * [44] EmptyElemTag ::= '<' Name (S Attribute)* S? '/>'
 | |
|  *
 | |
|  * [ WFC: Unique Att Spec ]
 | |
|  * No attribute name may appear more than once in the same start-tag or
 | |
|  * empty-element tag.
 | |
|  *
 | |
|  * With namespace:
 | |
|  *
 | |
|  * [NS 8] STag ::= '<' QName (S Attribute)* S? '>'
 | |
|  *
 | |
|  * [NS 10] EmptyElement ::= '<' QName (S Attribute)* S? '/>'
 | |
|  *
 | |
|  * Returns the element name parsed
 | |
|  */
 | |
| 
 | |
| const xmlChar *
 | |
| xmlParseStartTag(xmlParserCtxtPtr ctxt) {
 | |
|     const xmlChar *name;
 | |
|     const xmlChar *attname;
 | |
|     xmlChar *attvalue;
 | |
|     const xmlChar **atts = ctxt->atts;
 | |
|     int nbatts = 0;
 | |
|     int maxatts = ctxt->maxatts;
 | |
|     int i;
 | |
| 
 | |
|     if (RAW != '<') return(NULL);
 | |
|     NEXT1;
 | |
| 
 | |
|     name = xmlParseName(ctxt);
 | |
|     if (name == NULL) {
 | |
| 	xmlFatalErrMsg(ctxt, XML_ERR_NAME_REQUIRED,
 | |
| 	     "xmlParseStartTag: invalid element name\n");
 | |
|         return(NULL);
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * Now parse the attributes, it ends up with the ending
 | |
|      *
 | |
|      * (S Attribute)* S?
 | |
|      */
 | |
|     SKIP_BLANKS;
 | |
|     GROW;
 | |
| 
 | |
|     while (((RAW != '>') &&
 | |
| 	   ((RAW != '/') || (NXT(1) != '>')) &&
 | |
| 	   (IS_BYTE_CHAR(RAW))) && (ctxt->instate != XML_PARSER_EOF)) {
 | |
| 	attname = xmlParseAttribute(ctxt, &attvalue);
 | |
|         if (attname == NULL) {
 | |
| 	    xmlFatalErrMsg(ctxt, XML_ERR_INTERNAL_ERROR,
 | |
| 			   "xmlParseStartTag: problem parsing attributes\n");
 | |
| 	    break;
 | |
| 	}
 | |
|         if (attvalue != NULL) {
 | |
| 	    /*
 | |
| 	     * [ WFC: Unique Att Spec ]
 | |
| 	     * No attribute name may appear more than once in the same
 | |
| 	     * start-tag or empty-element tag.
 | |
| 	     */
 | |
| 	    for (i = 0; i < nbatts;i += 2) {
 | |
| 	        if (xmlStrEqual(atts[i], attname)) {
 | |
| 		    xmlErrAttributeDup(ctxt, NULL, attname);
 | |
| 		    xmlFree(attvalue);
 | |
| 		    goto failed;
 | |
| 		}
 | |
| 	    }
 | |
| 	    /*
 | |
| 	     * Add the pair to atts
 | |
| 	     */
 | |
| 	    if (atts == NULL) {
 | |
| 	        maxatts = 22; /* allow for 10 attrs by default */
 | |
| 	        atts = (const xmlChar **)
 | |
| 		       xmlMalloc(maxatts * sizeof(xmlChar *));
 | |
| 		if (atts == NULL) {
 | |
| 		    xmlErrMemory(ctxt, NULL);
 | |
| 		    if (attvalue != NULL)
 | |
| 			xmlFree(attvalue);
 | |
| 		    goto failed;
 | |
| 		}
 | |
| 		ctxt->atts = atts;
 | |
| 		ctxt->maxatts = maxatts;
 | |
| 	    } else if (nbatts + 4 > maxatts) {
 | |
| 	        const xmlChar **n;
 | |
| 
 | |
| 	        maxatts *= 2;
 | |
| 	        n = (const xmlChar **) xmlRealloc((void *) atts,
 | |
| 					     maxatts * sizeof(const xmlChar *));
 | |
| 		if (n == NULL) {
 | |
| 		    xmlErrMemory(ctxt, NULL);
 | |
| 		    if (attvalue != NULL)
 | |
| 			xmlFree(attvalue);
 | |
| 		    goto failed;
 | |
| 		}
 | |
| 		atts = n;
 | |
| 		ctxt->atts = atts;
 | |
| 		ctxt->maxatts = maxatts;
 | |
| 	    }
 | |
| 	    atts[nbatts++] = attname;
 | |
| 	    atts[nbatts++] = attvalue;
 | |
| 	    atts[nbatts] = NULL;
 | |
| 	    atts[nbatts + 1] = NULL;
 | |
| 	} else {
 | |
| 	    if (attvalue != NULL)
 | |
| 		xmlFree(attvalue);
 | |
| 	}
 | |
| 
 | |
| failed:
 | |
| 
 | |
| 	GROW
 | |
| 	if ((RAW == '>') || (((RAW == '/') && (NXT(1) == '>'))))
 | |
| 	    break;
 | |
| 	if (SKIP_BLANKS == 0) {
 | |
| 	    xmlFatalErrMsg(ctxt, XML_ERR_SPACE_REQUIRED,
 | |
| 			   "attributes construct error\n");
 | |
| 	}
 | |
| 	SHRINK;
 | |
|         GROW;
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * SAX: Start of Element !
 | |
|      */
 | |
|     if ((ctxt->sax != NULL) && (ctxt->sax->startElement != NULL) &&
 | |
| 	(!ctxt->disableSAX)) {
 | |
| 	if (nbatts > 0)
 | |
| 	    ctxt->sax->startElement(ctxt->userData, name, atts);
 | |
| 	else
 | |
| 	    ctxt->sax->startElement(ctxt->userData, name, NULL);
 | |
|     }
 | |
| 
 | |
|     if (atts != NULL) {
 | |
|         /* Free only the content strings */
 | |
|         for (i = 1;i < nbatts;i+=2)
 | |
| 	    if (atts[i] != NULL)
 | |
| 	       xmlFree((xmlChar *) atts[i]);
 | |
|     }
 | |
|     return(name);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseEndTag1:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @line:  line of the start tag
 | |
|  * @nsNr:  number of namespaces on the start tag
 | |
|  *
 | |
|  * Parse an end tag. Always consumes '</'.
 | |
|  *
 | |
|  * [42] ETag ::= '</' Name S? '>'
 | |
|  *
 | |
|  * With namespace
 | |
|  *
 | |
|  * [NS 9] ETag ::= '</' QName S? '>'
 | |
|  */
 | |
| 
 | |
| static void
 | |
| xmlParseEndTag1(xmlParserCtxtPtr ctxt, int line) {
 | |
|     const xmlChar *name;
 | |
| 
 | |
|     GROW;
 | |
|     if ((RAW != '<') || (NXT(1) != '/')) {
 | |
| 	xmlFatalErrMsg(ctxt, XML_ERR_LTSLASH_REQUIRED,
 | |
| 		       "xmlParseEndTag: '</' not found\n");
 | |
| 	return;
 | |
|     }
 | |
|     SKIP(2);
 | |
| 
 | |
|     name = xmlParseNameAndCompare(ctxt,ctxt->name);
 | |
| 
 | |
|     /*
 | |
|      * We should definitely be at the ending "S? '>'" part
 | |
|      */
 | |
|     GROW;
 | |
|     SKIP_BLANKS;
 | |
|     if ((!IS_BYTE_CHAR(RAW)) || (RAW != '>')) {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_GT_REQUIRED, NULL);
 | |
|     } else
 | |
| 	NEXT1;
 | |
| 
 | |
|     /*
 | |
|      * [ WFC: Element Type Match ]
 | |
|      * The Name in an element's end-tag must match the element type in the
 | |
|      * start-tag.
 | |
|      *
 | |
|      */
 | |
|     if (name != (xmlChar*)1) {
 | |
|         if (name == NULL) name = BAD_CAST "unparsable";
 | |
|         xmlFatalErrMsgStrIntStr(ctxt, XML_ERR_TAG_NAME_MISMATCH,
 | |
| 		     "Opening and ending tag mismatch: %s line %d and %s\n",
 | |
| 		                ctxt->name, line, name);
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * SAX: End of Tag
 | |
|      */
 | |
|     if ((ctxt->sax != NULL) && (ctxt->sax->endElement != NULL) &&
 | |
| 	(!ctxt->disableSAX))
 | |
|         ctxt->sax->endElement(ctxt->userData, ctxt->name);
 | |
| 
 | |
|     namePop(ctxt);
 | |
|     spacePop(ctxt);
 | |
|     return;
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseEndTag:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * parse an end of tag
 | |
|  *
 | |
|  * [42] ETag ::= '</' Name S? '>'
 | |
|  *
 | |
|  * With namespace
 | |
|  *
 | |
|  * [NS 9] ETag ::= '</' QName S? '>'
 | |
|  */
 | |
| 
 | |
| void
 | |
| xmlParseEndTag(xmlParserCtxtPtr ctxt) {
 | |
|     xmlParseEndTag1(ctxt, 0);
 | |
| }
 | |
| #endif /* LIBXML_SAX1_ENABLED */
 | |
| 
 | |
| /************************************************************************
 | |
|  *									*
 | |
|  *		      SAX 2 specific operations				*
 | |
|  *									*
 | |
|  ************************************************************************/
 | |
| 
 | |
| /**
 | |
|  * xmlParseQNameHashed:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @prefix:  pointer to store the prefix part
 | |
|  *
 | |
|  * parse an XML Namespace QName
 | |
|  *
 | |
|  * [6]  QName  ::= (Prefix ':')? LocalPart
 | |
|  * [7]  Prefix  ::= NCName
 | |
|  * [8]  LocalPart  ::= NCName
 | |
|  *
 | |
|  * Returns the Name parsed or NULL
 | |
|  */
 | |
| 
 | |
| static xmlHashedString
 | |
| xmlParseQNameHashed(xmlParserCtxtPtr ctxt, xmlHashedString *prefix) {
 | |
|     xmlHashedString l, p;
 | |
|     int start;
 | |
| 
 | |
|     l.name = NULL;
 | |
|     p.name = NULL;
 | |
| 
 | |
|     GROW;
 | |
|     if (ctxt->instate == XML_PARSER_EOF)
 | |
|         return(l);
 | |
|     start = CUR_PTR - BASE_PTR;
 | |
| 
 | |
|     l = xmlParseNCName(ctxt);
 | |
|     if ((l.name != NULL) && (CUR == ':')) {
 | |
|         NEXT;
 | |
| 	p = l;
 | |
| 	l = xmlParseNCName(ctxt);
 | |
|     }
 | |
|     if ((l.name == NULL) || (CUR == ':')) {
 | |
|         xmlChar *tmp;
 | |
| 
 | |
|         l.name = NULL;
 | |
|         p.name = NULL;
 | |
|         if (ctxt->instate == XML_PARSER_EOF)
 | |
|             return(l);
 | |
|         if ((CUR != ':') && (CUR_PTR <= BASE_PTR + start))
 | |
|             return(l);
 | |
|         tmp = xmlParseNmtoken(ctxt);
 | |
|         if (tmp != NULL)
 | |
|             xmlFree(tmp);
 | |
|         if (ctxt->instate == XML_PARSER_EOF)
 | |
|             return(l);
 | |
|         l = xmlDictLookupHashed(ctxt->dict, BASE_PTR + start,
 | |
|                                 CUR_PTR - (BASE_PTR + start));
 | |
|         xmlNsErr(ctxt, XML_NS_ERR_QNAME,
 | |
|                  "Failed to parse QName '%s'\n", l.name, NULL, NULL);
 | |
|     }
 | |
| 
 | |
|     *prefix = p;
 | |
|     return(l);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseQName:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @prefix:  pointer to store the prefix part
 | |
|  *
 | |
|  * parse an XML Namespace QName
 | |
|  *
 | |
|  * [6]  QName  ::= (Prefix ':')? LocalPart
 | |
|  * [7]  Prefix  ::= NCName
 | |
|  * [8]  LocalPart  ::= NCName
 | |
|  *
 | |
|  * Returns the Name parsed or NULL
 | |
|  */
 | |
| 
 | |
| static const xmlChar *
 | |
| xmlParseQName(xmlParserCtxtPtr ctxt, const xmlChar **prefix) {
 | |
|     xmlHashedString n, p;
 | |
| 
 | |
|     n = xmlParseQNameHashed(ctxt, &p);
 | |
|     if (n.name == NULL)
 | |
|         return(NULL);
 | |
|     *prefix = p.name;
 | |
|     return(n.name);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseQNameAndCompare:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @name:  the localname
 | |
|  * @prefix:  the prefix, if any.
 | |
|  *
 | |
|  * parse an XML name and compares for match
 | |
|  * (specialized for endtag parsing)
 | |
|  *
 | |
|  * Returns NULL for an illegal name, (xmlChar*) 1 for success
 | |
|  * and the name for mismatch
 | |
|  */
 | |
| 
 | |
| static const xmlChar *
 | |
| xmlParseQNameAndCompare(xmlParserCtxtPtr ctxt, xmlChar const *name,
 | |
|                         xmlChar const *prefix) {
 | |
|     const xmlChar *cmp;
 | |
|     const xmlChar *in;
 | |
|     const xmlChar *ret;
 | |
|     const xmlChar *prefix2;
 | |
| 
 | |
|     if (prefix == NULL) return(xmlParseNameAndCompare(ctxt, name));
 | |
| 
 | |
|     GROW;
 | |
|     in = ctxt->input->cur;
 | |
| 
 | |
|     cmp = prefix;
 | |
|     while (*in != 0 && *in == *cmp) {
 | |
| 	++in;
 | |
| 	++cmp;
 | |
|     }
 | |
|     if ((*cmp == 0) && (*in == ':')) {
 | |
|         in++;
 | |
| 	cmp = name;
 | |
| 	while (*in != 0 && *in == *cmp) {
 | |
| 	    ++in;
 | |
| 	    ++cmp;
 | |
| 	}
 | |
| 	if (*cmp == 0 && (*in == '>' || IS_BLANK_CH (*in))) {
 | |
| 	    /* success */
 | |
|             ctxt->input->col += in - ctxt->input->cur;
 | |
| 	    ctxt->input->cur = in;
 | |
| 	    return((const xmlChar*) 1);
 | |
| 	}
 | |
|     }
 | |
|     /*
 | |
|      * all strings coms from the dictionary, equality can be done directly
 | |
|      */
 | |
|     ret = xmlParseQName (ctxt, &prefix2);
 | |
|     if (ret == NULL)
 | |
|         return(NULL);
 | |
|     if ((ret == name) && (prefix == prefix2))
 | |
| 	return((const xmlChar*) 1);
 | |
|     return ret;
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseAttValueInternal:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @len:  attribute len result
 | |
|  * @alloc:  whether the attribute was reallocated as a new string
 | |
|  * @normalize:  if 1 then further non-CDATA normalization must be done
 | |
|  *
 | |
|  * parse a value for an attribute.
 | |
|  * NOTE: if no normalization is needed, the routine will return pointers
 | |
|  *       directly from the data buffer.
 | |
|  *
 | |
|  * 3.3.3 Attribute-Value Normalization:
 | |
|  * Before the value of an attribute is passed to the application or
 | |
|  * checked for validity, the XML processor must normalize it as follows:
 | |
|  * - a character reference is processed by appending the referenced
 | |
|  *   character to the attribute value
 | |
|  * - an entity reference is processed by recursively processing the
 | |
|  *   replacement text of the entity
 | |
|  * - a whitespace character (#x20, #xD, #xA, #x9) is processed by
 | |
|  *   appending #x20 to the normalized value, except that only a single
 | |
|  *   #x20 is appended for a "#xD#xA" sequence that is part of an external
 | |
|  *   parsed entity or the literal entity value of an internal parsed entity
 | |
|  * - other characters are processed by appending them to the normalized value
 | |
|  * If the declared value is not CDATA, then the XML processor must further
 | |
|  * process the normalized attribute value by discarding any leading and
 | |
|  * trailing space (#x20) characters, and by replacing sequences of space
 | |
|  * (#x20) characters by a single space (#x20) character.
 | |
|  * All attributes for which no declaration has been read should be treated
 | |
|  * by a non-validating parser as if declared CDATA.
 | |
|  *
 | |
|  * Returns the AttValue parsed or NULL. The value has to be freed by the
 | |
|  *     caller if it was copied, this can be detected by val[*len] == 0.
 | |
|  */
 | |
| 
 | |
| #define GROW_PARSE_ATT_VALUE_INTERNAL(ctxt, in, start, end) \
 | |
|     const xmlChar *oldbase = ctxt->input->base;\
 | |
|     GROW;\
 | |
|     if (ctxt->instate == XML_PARSER_EOF)\
 | |
|         return(NULL);\
 | |
|     if (oldbase != ctxt->input->base) {\
 | |
|         ptrdiff_t delta = ctxt->input->base - oldbase;\
 | |
|         start = start + delta;\
 | |
|         in = in + delta;\
 | |
|     }\
 | |
|     end = ctxt->input->end;
 | |
| 
 | |
| static xmlChar *
 | |
| xmlParseAttValueInternal(xmlParserCtxtPtr ctxt, int *len, int *alloc,
 | |
|                          int normalize)
 | |
| {
 | |
|     xmlChar limit = 0;
 | |
|     const xmlChar *in = NULL, *start, *end, *last;
 | |
|     xmlChar *ret = NULL;
 | |
|     int line, col;
 | |
|     int maxLength = (ctxt->options & XML_PARSE_HUGE) ?
 | |
|                     XML_MAX_HUGE_LENGTH :
 | |
|                     XML_MAX_TEXT_LENGTH;
 | |
| 
 | |
|     GROW;
 | |
|     in = (xmlChar *) CUR_PTR;
 | |
|     line = ctxt->input->line;
 | |
|     col = ctxt->input->col;
 | |
|     if (*in != '"' && *in != '\'') {
 | |
|         xmlFatalErr(ctxt, XML_ERR_ATTRIBUTE_NOT_STARTED, NULL);
 | |
|         return (NULL);
 | |
|     }
 | |
|     ctxt->instate = XML_PARSER_ATTRIBUTE_VALUE;
 | |
| 
 | |
|     /*
 | |
|      * try to handle in this routine the most common case where no
 | |
|      * allocation of a new string is required and where content is
 | |
|      * pure ASCII.
 | |
|      */
 | |
|     limit = *in++;
 | |
|     col++;
 | |
|     end = ctxt->input->end;
 | |
|     start = in;
 | |
|     if (in >= end) {
 | |
|         GROW_PARSE_ATT_VALUE_INTERNAL(ctxt, in, start, end)
 | |
|     }
 | |
|     if (normalize) {
 | |
|         /*
 | |
| 	 * Skip any leading spaces
 | |
| 	 */
 | |
| 	while ((in < end) && (*in != limit) &&
 | |
| 	       ((*in == 0x20) || (*in == 0x9) ||
 | |
| 	        (*in == 0xA) || (*in == 0xD))) {
 | |
| 	    if (*in == 0xA) {
 | |
| 	        line++; col = 1;
 | |
| 	    } else {
 | |
| 	        col++;
 | |
| 	    }
 | |
| 	    in++;
 | |
| 	    start = in;
 | |
| 	    if (in >= end) {
 | |
|                 GROW_PARSE_ATT_VALUE_INTERNAL(ctxt, in, start, end)
 | |
|                 if ((in - start) > maxLength) {
 | |
|                     xmlFatalErrMsg(ctxt, XML_ERR_ATTRIBUTE_NOT_FINISHED,
 | |
|                                    "AttValue length too long\n");
 | |
|                     return(NULL);
 | |
|                 }
 | |
| 	    }
 | |
| 	}
 | |
| 	while ((in < end) && (*in != limit) && (*in >= 0x20) &&
 | |
| 	       (*in <= 0x7f) && (*in != '&') && (*in != '<')) {
 | |
| 	    col++;
 | |
| 	    if ((*in++ == 0x20) && (*in == 0x20)) break;
 | |
| 	    if (in >= end) {
 | |
|                 GROW_PARSE_ATT_VALUE_INTERNAL(ctxt, in, start, end)
 | |
|                 if ((in - start) > maxLength) {
 | |
|                     xmlFatalErrMsg(ctxt, XML_ERR_ATTRIBUTE_NOT_FINISHED,
 | |
|                                    "AttValue length too long\n");
 | |
|                     return(NULL);
 | |
|                 }
 | |
| 	    }
 | |
| 	}
 | |
| 	last = in;
 | |
| 	/*
 | |
| 	 * skip the trailing blanks
 | |
| 	 */
 | |
| 	while ((last[-1] == 0x20) && (last > start)) last--;
 | |
| 	while ((in < end) && (*in != limit) &&
 | |
| 	       ((*in == 0x20) || (*in == 0x9) ||
 | |
| 	        (*in == 0xA) || (*in == 0xD))) {
 | |
| 	    if (*in == 0xA) {
 | |
| 	        line++, col = 1;
 | |
| 	    } else {
 | |
| 	        col++;
 | |
| 	    }
 | |
| 	    in++;
 | |
| 	    if (in >= end) {
 | |
| 		const xmlChar *oldbase = ctxt->input->base;
 | |
| 		GROW;
 | |
|                 if (ctxt->instate == XML_PARSER_EOF)
 | |
|                     return(NULL);
 | |
| 		if (oldbase != ctxt->input->base) {
 | |
| 		    ptrdiff_t delta = ctxt->input->base - oldbase;
 | |
| 		    start = start + delta;
 | |
| 		    in = in + delta;
 | |
| 		    last = last + delta;
 | |
| 		}
 | |
| 		end = ctxt->input->end;
 | |
|                 if ((in - start) > maxLength) {
 | |
|                     xmlFatalErrMsg(ctxt, XML_ERR_ATTRIBUTE_NOT_FINISHED,
 | |
|                                    "AttValue length too long\n");
 | |
|                     return(NULL);
 | |
|                 }
 | |
| 	    }
 | |
| 	}
 | |
|         if ((in - start) > maxLength) {
 | |
|             xmlFatalErrMsg(ctxt, XML_ERR_ATTRIBUTE_NOT_FINISHED,
 | |
|                            "AttValue length too long\n");
 | |
|             return(NULL);
 | |
|         }
 | |
| 	if (*in != limit) goto need_complex;
 | |
|     } else {
 | |
| 	while ((in < end) && (*in != limit) && (*in >= 0x20) &&
 | |
| 	       (*in <= 0x7f) && (*in != '&') && (*in != '<')) {
 | |
| 	    in++;
 | |
| 	    col++;
 | |
| 	    if (in >= end) {
 | |
|                 GROW_PARSE_ATT_VALUE_INTERNAL(ctxt, in, start, end)
 | |
|                 if ((in - start) > maxLength) {
 | |
|                     xmlFatalErrMsg(ctxt, XML_ERR_ATTRIBUTE_NOT_FINISHED,
 | |
|                                    "AttValue length too long\n");
 | |
|                     return(NULL);
 | |
|                 }
 | |
| 	    }
 | |
| 	}
 | |
| 	last = in;
 | |
|         if ((in - start) > maxLength) {
 | |
|             xmlFatalErrMsg(ctxt, XML_ERR_ATTRIBUTE_NOT_FINISHED,
 | |
|                            "AttValue length too long\n");
 | |
|             return(NULL);
 | |
|         }
 | |
| 	if (*in != limit) goto need_complex;
 | |
|     }
 | |
|     in++;
 | |
|     col++;
 | |
|     if (len != NULL) {
 | |
|         if (alloc) *alloc = 0;
 | |
|         *len = last - start;
 | |
|         ret = (xmlChar *) start;
 | |
|     } else {
 | |
|         if (alloc) *alloc = 1;
 | |
|         ret = xmlStrndup(start, last - start);
 | |
|     }
 | |
|     CUR_PTR = in;
 | |
|     ctxt->input->line = line;
 | |
|     ctxt->input->col = col;
 | |
|     return ret;
 | |
| need_complex:
 | |
|     if (alloc) *alloc = 1;
 | |
|     return xmlParseAttValueComplex(ctxt, len, normalize);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseAttribute2:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @pref:  the element prefix
 | |
|  * @elem:  the element name
 | |
|  * @prefix:  a xmlChar ** used to store the value of the attribute prefix
 | |
|  * @value:  a xmlChar ** used to store the value of the attribute
 | |
|  * @len:  an int * to save the length of the attribute
 | |
|  * @alloc:  an int * to indicate if the attribute was allocated
 | |
|  *
 | |
|  * parse an attribute in the new SAX2 framework.
 | |
|  *
 | |
|  * Returns the attribute name, and the value in *value, .
 | |
|  */
 | |
| 
 | |
| static xmlHashedString
 | |
| xmlParseAttribute2(xmlParserCtxtPtr ctxt,
 | |
|                    const xmlChar * pref, const xmlChar * elem,
 | |
|                    xmlHashedString * hprefix, xmlChar ** value,
 | |
|                    int *len, int *alloc)
 | |
| {
 | |
|     xmlHashedString hname;
 | |
|     const xmlChar *prefix, *name;
 | |
|     xmlChar *val, *internal_val = NULL;
 | |
|     int normalize = 0;
 | |
| 
 | |
|     *value = NULL;
 | |
|     GROW;
 | |
|     hname = xmlParseQNameHashed(ctxt, hprefix);
 | |
|     if (hname.name == NULL) {
 | |
|         xmlFatalErrMsg(ctxt, XML_ERR_NAME_REQUIRED,
 | |
|                        "error parsing attribute name\n");
 | |
|         return(hname);
 | |
|     }
 | |
|     name = hname.name;
 | |
|     if (hprefix->name != NULL)
 | |
|         prefix = hprefix->name;
 | |
|     else
 | |
|         prefix = NULL;
 | |
| 
 | |
|     /*
 | |
|      * get the type if needed
 | |
|      */
 | |
|     if (ctxt->attsSpecial != NULL) {
 | |
|         int type;
 | |
| 
 | |
|         type = (int) (ptrdiff_t) xmlHashQLookup2(ctxt->attsSpecial,
 | |
|                                                  pref, elem,
 | |
|                                                  prefix, name);
 | |
|         if (type != 0)
 | |
|             normalize = 1;
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * read the value
 | |
|      */
 | |
|     SKIP_BLANKS;
 | |
|     if (RAW == '=') {
 | |
|         NEXT;
 | |
|         SKIP_BLANKS;
 | |
|         val = xmlParseAttValueInternal(ctxt, len, alloc, normalize);
 | |
|         if (val == NULL) {
 | |
|             hname.name = NULL;
 | |
|             return(hname);
 | |
|         }
 | |
| 	if (normalize) {
 | |
| 	    /*
 | |
| 	     * Sometimes a second normalisation pass for spaces is needed
 | |
| 	     * but that only happens if charrefs or entities references
 | |
| 	     * have been used in the attribute value, i.e. the attribute
 | |
| 	     * value have been extracted in an allocated string already.
 | |
| 	     */
 | |
| 	    if (*alloc) {
 | |
| 	        const xmlChar *val2;
 | |
| 
 | |
| 	        val2 = xmlAttrNormalizeSpace2(ctxt, val, len);
 | |
| 		if ((val2 != NULL) && (val2 != val)) {
 | |
| 		    xmlFree(val);
 | |
| 		    val = (xmlChar *) val2;
 | |
| 		}
 | |
| 	    }
 | |
| 	}
 | |
|         ctxt->instate = XML_PARSER_CONTENT;
 | |
|     } else {
 | |
|         xmlFatalErrMsgStr(ctxt, XML_ERR_ATTRIBUTE_WITHOUT_VALUE,
 | |
|                           "Specification mandates value for attribute %s\n",
 | |
|                           name);
 | |
|         return(hname);
 | |
|     }
 | |
| 
 | |
|     if (prefix == ctxt->str_xml) {
 | |
|         /*
 | |
|          * Check that xml:lang conforms to the specification
 | |
|          * No more registered as an error, just generate a warning now
 | |
|          * since this was deprecated in XML second edition
 | |
|          */
 | |
|         if ((ctxt->pedantic) && (xmlStrEqual(name, BAD_CAST "lang"))) {
 | |
|             internal_val = xmlStrndup(val, *len);
 | |
|             if (!xmlCheckLanguageID(internal_val)) {
 | |
|                 xmlWarningMsg(ctxt, XML_WAR_LANG_VALUE,
 | |
|                               "Malformed value for xml:lang : %s\n",
 | |
|                               internal_val, NULL);
 | |
|             }
 | |
|         }
 | |
| 
 | |
|         /*
 | |
|          * Check that xml:space conforms to the specification
 | |
|          */
 | |
|         if (xmlStrEqual(name, BAD_CAST "space")) {
 | |
|             internal_val = xmlStrndup(val, *len);
 | |
|             if (xmlStrEqual(internal_val, BAD_CAST "default"))
 | |
|                 *(ctxt->space) = 0;
 | |
|             else if (xmlStrEqual(internal_val, BAD_CAST "preserve"))
 | |
|                 *(ctxt->space) = 1;
 | |
|             else {
 | |
|                 xmlWarningMsg(ctxt, XML_WAR_SPACE_VALUE,
 | |
|                               "Invalid value \"%s\" for xml:space : \"default\" or \"preserve\" expected\n",
 | |
|                               internal_val, NULL);
 | |
|             }
 | |
|         }
 | |
|         if (internal_val) {
 | |
|             xmlFree(internal_val);
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     *value = val;
 | |
|     return (hname);
 | |
| }
 | |
| 
 | |
| ATTRIBUTE_NO_SANITIZE_INTEGER
 | |
| static unsigned
 | |
| xmlCombineHash(unsigned v1, unsigned v2) {
 | |
|     return(HASH_ROL(v1, 15) ^ v2);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlAttrHashInsert:
 | |
|  * @ctxt: parser context
 | |
|  * @aindex: attribute index (this is a multiple of 5)
 | |
|  * @sizePtr: size of the hash table (input/output value)
 | |
|  * @name: attribute name
 | |
|  * @uri: namespace uri
 | |
|  * @hashValue: combined hash value of name and uri
 | |
|  *
 | |
|  * Inserts a new attribute into the hash table.
 | |
|  *
 | |
|  * Returns INT_MAX if no existing attribute was found, the attribute
 | |
|  * index if an attribute was found, -1 if a memory allocation failed.
 | |
|  */
 | |
| static int
 | |
| xmlAttrHashInsert(xmlParserCtxtPtr ctxt, int aindex, unsigned *sizePtr,
 | |
|                   const xmlChar *name, const xmlChar *uri,
 | |
|                   unsigned hashValue) {
 | |
|     xmlAttrHashBucket *table = ctxt->attrHash;
 | |
|     xmlAttrHashBucket *bucket;
 | |
|     unsigned hindex;
 | |
|     unsigned size = *sizePtr;
 | |
| 
 | |
|     if (size > 0) {
 | |
|         hindex = hashValue & (size - 1);
 | |
|         bucket = &table[hindex];
 | |
| 
 | |
|         while (bucket->hashValue != 0) {
 | |
|             const xmlChar **atts = &ctxt->atts[bucket->index];
 | |
| 
 | |
|             if (name == atts[0]) {
 | |
|                 int nsIndex = (int) (ptrdiff_t) atts[2];
 | |
| 
 | |
|                 if ((nsIndex == NS_INDEX_EMPTY) ? (uri == NULL) :
 | |
|                     (nsIndex == NS_INDEX_XML) ? (uri == ctxt->str_xml) :
 | |
|                     (uri == ctxt->nsTab[nsIndex * 2 + 1]))
 | |
|                     return(bucket->index);
 | |
|             }
 | |
| 
 | |
|             hindex++;
 | |
|             bucket++;
 | |
|             if (hindex >= size) {
 | |
|                 hindex = 0;
 | |
|                 bucket = table;
 | |
|             }
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * Grow hash table
 | |
|      */
 | |
|     if ((unsigned) aindex / 5 >= size / 2) {
 | |
|         xmlAttrHashBucket *newTable;
 | |
|         unsigned newSize, i, nindex;
 | |
| 
 | |
|         newSize = size ? size * 2 : 8;
 | |
| 
 | |
|         if (newSize > ctxt->attrHashMax) {
 | |
|             newTable = xmlRealloc(table, newSize * sizeof(newTable[0]));
 | |
|             if (newTable == NULL) {
 | |
|                 xmlErrMemory(ctxt, NULL);
 | |
|                 return(-1);
 | |
|             }
 | |
| 
 | |
|             table = newTable;
 | |
|             ctxt->attrHash = newTable;
 | |
|             ctxt->attrHashMax = newSize;
 | |
|         }
 | |
| 
 | |
|         memset(&table[size], 0, (newSize - size) * sizeof(table[0]));
 | |
| 
 | |
|         if (size > 0) {
 | |
|             /*
 | |
|              * We must search for the start of a probe sequence to make
 | |
|              * in-place operation work.
 | |
|              */
 | |
|             hindex = 0;
 | |
|             bucket = table;
 | |
|             while (bucket->hashValue != 0) {
 | |
|                 hindex++;
 | |
|                 bucket++;
 | |
|             }
 | |
| 
 | |
|             for (i = 0; i < size; i++) {
 | |
|                 if (bucket->hashValue != 0) {
 | |
|                     nindex = bucket->hashValue & (newSize - 1);
 | |
| 
 | |
|                     while (nindex != hindex) {
 | |
|                         if (table[nindex].hashValue == 0) {
 | |
|                             table[nindex] = *bucket;
 | |
|                             bucket->hashValue = 0;
 | |
|                             break;
 | |
|                         }
 | |
| 
 | |
|                         nindex++;
 | |
|                         if (nindex >= newSize)
 | |
|                             nindex = 0;
 | |
|                     }
 | |
|                 }
 | |
| 
 | |
|                 hindex++;
 | |
|                 bucket++;
 | |
|                 if (hindex >= size) {
 | |
|                     hindex = 0;
 | |
|                     bucket = table;
 | |
|                 }
 | |
|             }
 | |
|         }
 | |
| 
 | |
|         size = newSize;
 | |
|         *sizePtr = newSize;
 | |
| 
 | |
|         /*
 | |
|          * Relookup
 | |
|          */
 | |
|         hindex = hashValue & (size - 1);
 | |
|         bucket = &table[hindex];
 | |
| 
 | |
|         while (bucket->hashValue != 0) {
 | |
|             hindex++;
 | |
|             bucket++;
 | |
|             if (hindex >= size) {
 | |
|                 hindex = 0;
 | |
|                 bucket = table;
 | |
|             }
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     bucket->hashValue = hashValue;
 | |
|     bucket->index = aindex;
 | |
| 
 | |
|     return(INT_MAX);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseStartTag2:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * Parse a start tag. Always consumes '<'.
 | |
|  *
 | |
|  * This routine is called when running SAX2 parsing
 | |
|  *
 | |
|  * [40] STag ::= '<' Name (S Attribute)* S? '>'
 | |
|  *
 | |
|  * [ WFC: Unique Att Spec ]
 | |
|  * No attribute name may appear more than once in the same start-tag or
 | |
|  * empty-element tag.
 | |
|  *
 | |
|  * [44] EmptyElemTag ::= '<' Name (S Attribute)* S? '/>'
 | |
|  *
 | |
|  * [ WFC: Unique Att Spec ]
 | |
|  * No attribute name may appear more than once in the same start-tag or
 | |
|  * empty-element tag.
 | |
|  *
 | |
|  * With namespace:
 | |
|  *
 | |
|  * [NS 8] STag ::= '<' QName (S Attribute)* S? '>'
 | |
|  *
 | |
|  * [NS 10] EmptyElement ::= '<' QName (S Attribute)* S? '/>'
 | |
|  *
 | |
|  * Returns the element name parsed
 | |
|  */
 | |
| 
 | |
| static const xmlChar *
 | |
| xmlParseStartTag2(xmlParserCtxtPtr ctxt, const xmlChar **pref,
 | |
|                   const xmlChar **URI, int *nbNsPtr) {
 | |
|     xmlHashedString hlocalname;
 | |
|     xmlHashedString hprefix;
 | |
|     xmlHashedString hattname;
 | |
|     xmlHashedString haprefix;
 | |
|     const xmlChar *localname;
 | |
|     const xmlChar *prefix;
 | |
|     const xmlChar *attname;
 | |
|     const xmlChar *aprefix;
 | |
|     const xmlChar *uri;
 | |
|     xmlChar *attvalue = NULL;
 | |
|     const xmlChar **atts = ctxt->atts;
 | |
|     unsigned attrHashSize = 0;
 | |
|     int maxatts = ctxt->maxatts;
 | |
|     int nratts, nbatts, nbdef, inputid;
 | |
|     int i, j, nbNs, attval, nsIndex;
 | |
|     int alloc = 0;
 | |
| 
 | |
|     if (RAW != '<') return(NULL);
 | |
|     NEXT1;
 | |
| 
 | |
|     inputid = ctxt->input->id;
 | |
|     nbatts = 0;
 | |
|     nratts = 0;
 | |
|     nbdef = 0;
 | |
|     nbNs = 0;
 | |
|     attval = 0;
 | |
| 
 | |
|     if (xmlParserNsStartElement(ctxt->nsdb) < 0) {
 | |
|         xmlErrMemory(ctxt, NULL);
 | |
|         return(NULL);
 | |
|     }
 | |
| 
 | |
|     hlocalname = xmlParseQNameHashed(ctxt, &hprefix);
 | |
|     if (hlocalname.name == NULL) {
 | |
| 	xmlFatalErrMsg(ctxt, XML_ERR_NAME_REQUIRED,
 | |
| 		       "StartTag: invalid element name\n");
 | |
|         return(NULL);
 | |
|     }
 | |
|     localname = hlocalname.name;
 | |
|     prefix = hprefix.name;
 | |
| 
 | |
|     /*
 | |
|      * Now parse the attributes, it ends up with the ending
 | |
|      *
 | |
|      * (S Attribute)* S?
 | |
|      */
 | |
|     SKIP_BLANKS;
 | |
|     GROW;
 | |
| 
 | |
|     /*
 | |
|      * The ctxt->atts array will be ultimately passed to the SAX callback
 | |
|      * containing five xmlChar pointers for each attribute:
 | |
|      *
 | |
|      * [0] attribute name
 | |
|      * [1] attribute prefix
 | |
|      * [2] namespace URI
 | |
|      * [3] attribute value
 | |
|      * [4] end of attribute value
 | |
|      *
 | |
|      * To save memory, we reuse this array temporarily and store integers
 | |
|      * in these pointer variables.
 | |
|      *
 | |
|      * [0] attribute name
 | |
|      * [1] attribute prefix
 | |
|      * [2] hash value of attribute prefix, and later namespace index
 | |
|      * [3] for non-allocated values: ptrdiff_t offset into input buffer
 | |
|      * [4] for non-allocated values: ptrdiff_t offset into input buffer
 | |
|      *
 | |
|      * The ctxt->attallocs array contains an additional unsigned int for
 | |
|      * each attribute, containing the hash value of the attribute name
 | |
|      * and the alloc flag in bit 31.
 | |
|      */
 | |
| 
 | |
|     while (((RAW != '>') &&
 | |
| 	   ((RAW != '/') || (NXT(1) != '>')) &&
 | |
| 	   (IS_BYTE_CHAR(RAW))) && (ctxt->instate != XML_PARSER_EOF)) {
 | |
| 	int len = -1;
 | |
| 
 | |
| 	hattname = xmlParseAttribute2(ctxt, prefix, localname,
 | |
|                                           &haprefix, &attvalue, &len,
 | |
|                                           &alloc);
 | |
|         if (hattname.name == NULL) {
 | |
| 	    xmlFatalErr(ctxt, XML_ERR_INTERNAL_ERROR,
 | |
| 	         "xmlParseStartTag: problem parsing attributes\n");
 | |
| 	    break;
 | |
| 	}
 | |
|         if (attvalue == NULL)
 | |
|             goto next_attr;
 | |
|         attname = hattname.name;
 | |
|         aprefix = haprefix.name;
 | |
| 	if (len < 0) len = xmlStrlen(attvalue);
 | |
| 
 | |
|         if ((attname == ctxt->str_xmlns) && (aprefix == NULL)) {
 | |
|             xmlHashedString huri;
 | |
|             xmlURIPtr parsedUri;
 | |
| 
 | |
|             huri = xmlDictLookupHashed(ctxt->dict, attvalue, len);
 | |
|             uri = huri.name;
 | |
|             if (uri == NULL) {
 | |
|                 xmlErrMemory(ctxt, NULL);
 | |
|                 goto next_attr;
 | |
|             }
 | |
|             if (*uri != 0) {
 | |
|                 parsedUri = xmlParseURI((const char *) uri);
 | |
|                 if (parsedUri == NULL) {
 | |
|                     xmlNsErr(ctxt, XML_WAR_NS_URI,
 | |
|                              "xmlns: '%s' is not a valid URI\n",
 | |
|                                        uri, NULL, NULL);
 | |
|                 } else {
 | |
|                     if (parsedUri->scheme == NULL) {
 | |
|                         xmlNsWarn(ctxt, XML_WAR_NS_URI_RELATIVE,
 | |
|                                   "xmlns: URI %s is not absolute\n",
 | |
|                                   uri, NULL, NULL);
 | |
|                     }
 | |
|                     xmlFreeURI(parsedUri);
 | |
|                 }
 | |
|                 if (uri == ctxt->str_xml_ns) {
 | |
|                     if (attname != ctxt->str_xml) {
 | |
|                         xmlNsErr(ctxt, XML_NS_ERR_XML_NAMESPACE,
 | |
|                      "xml namespace URI cannot be the default namespace\n",
 | |
|                                  NULL, NULL, NULL);
 | |
|                     }
 | |
|                     goto next_attr;
 | |
|                 }
 | |
|                 if ((len == 29) &&
 | |
|                     (xmlStrEqual(uri,
 | |
|                              BAD_CAST "http://www.w3.org/2000/xmlns/"))) {
 | |
|                     xmlNsErr(ctxt, XML_NS_ERR_XML_NAMESPACE,
 | |
|                          "reuse of the xmlns namespace name is forbidden\n",
 | |
|                              NULL, NULL, NULL);
 | |
|                     goto next_attr;
 | |
|                 }
 | |
|             }
 | |
| 
 | |
|             if (xmlParserNsPush(ctxt, NULL, &huri, NULL, 0) > 0)
 | |
|                 nbNs++;
 | |
|         } else if (aprefix == ctxt->str_xmlns) {
 | |
|             xmlHashedString huri;
 | |
|             xmlURIPtr parsedUri;
 | |
| 
 | |
|             huri = xmlDictLookupHashed(ctxt->dict, attvalue, len);
 | |
|             uri = huri.name;
 | |
|             if (uri == NULL) {
 | |
|                 xmlErrMemory(ctxt, NULL);
 | |
|                 goto next_attr;
 | |
|             }
 | |
| 
 | |
|             if (attname == ctxt->str_xml) {
 | |
|                 if (uri != ctxt->str_xml_ns) {
 | |
|                     xmlNsErr(ctxt, XML_NS_ERR_XML_NAMESPACE,
 | |
|                              "xml namespace prefix mapped to wrong URI\n",
 | |
|                              NULL, NULL, NULL);
 | |
|                 }
 | |
|                 /*
 | |
|                  * Do not keep a namespace definition node
 | |
|                  */
 | |
|                 goto next_attr;
 | |
|             }
 | |
|             if (uri == ctxt->str_xml_ns) {
 | |
|                 if (attname != ctxt->str_xml) {
 | |
|                     xmlNsErr(ctxt, XML_NS_ERR_XML_NAMESPACE,
 | |
|                              "xml namespace URI mapped to wrong prefix\n",
 | |
|                              NULL, NULL, NULL);
 | |
|                 }
 | |
|                 goto next_attr;
 | |
|             }
 | |
|             if (attname == ctxt->str_xmlns) {
 | |
|                 xmlNsErr(ctxt, XML_NS_ERR_XML_NAMESPACE,
 | |
|                          "redefinition of the xmlns prefix is forbidden\n",
 | |
|                          NULL, NULL, NULL);
 | |
|                 goto next_attr;
 | |
|             }
 | |
|             if ((len == 29) &&
 | |
|                 (xmlStrEqual(uri,
 | |
|                              BAD_CAST "http://www.w3.org/2000/xmlns/"))) {
 | |
|                 xmlNsErr(ctxt, XML_NS_ERR_XML_NAMESPACE,
 | |
|                          "reuse of the xmlns namespace name is forbidden\n",
 | |
|                          NULL, NULL, NULL);
 | |
|                 goto next_attr;
 | |
|             }
 | |
|             if ((uri == NULL) || (uri[0] == 0)) {
 | |
|                 xmlNsErr(ctxt, XML_NS_ERR_XML_NAMESPACE,
 | |
|                          "xmlns:%s: Empty XML namespace is not allowed\n",
 | |
|                               attname, NULL, NULL);
 | |
|                 goto next_attr;
 | |
|             } else {
 | |
|                 parsedUri = xmlParseURI((const char *) uri);
 | |
|                 if (parsedUri == NULL) {
 | |
|                     xmlNsErr(ctxt, XML_WAR_NS_URI,
 | |
|                          "xmlns:%s: '%s' is not a valid URI\n",
 | |
|                                        attname, uri, NULL);
 | |
|                 } else {
 | |
|                     if ((ctxt->pedantic) && (parsedUri->scheme == NULL)) {
 | |
|                         xmlNsWarn(ctxt, XML_WAR_NS_URI_RELATIVE,
 | |
|                                   "xmlns:%s: URI %s is not absolute\n",
 | |
|                                   attname, uri, NULL);
 | |
|                     }
 | |
|                     xmlFreeURI(parsedUri);
 | |
|                 }
 | |
|             }
 | |
| 
 | |
|             if (xmlParserNsPush(ctxt, &hattname, &huri, NULL, 0) > 0)
 | |
|                 nbNs++;
 | |
|         } else {
 | |
|             /*
 | |
|              * Populate attributes array, see above for repurposing
 | |
|              * of xmlChar pointers.
 | |
|              */
 | |
|             if ((atts == NULL) || (nbatts + 5 > maxatts)) {
 | |
|                 if (xmlCtxtGrowAttrs(ctxt, nbatts + 5) < 0) {
 | |
|                     goto next_attr;
 | |
|                 }
 | |
|                 maxatts = ctxt->maxatts;
 | |
|                 atts = ctxt->atts;
 | |
|             }
 | |
|             ctxt->attallocs[nratts++] = (hattname.hashValue & 0x7FFFFFFF) |
 | |
|                                         ((unsigned) alloc << 31);
 | |
|             atts[nbatts++] = attname;
 | |
|             atts[nbatts++] = aprefix;
 | |
|             atts[nbatts++] = (const xmlChar *) (size_t) haprefix.hashValue;
 | |
|             if (alloc) {
 | |
|                 atts[nbatts++] = attvalue;
 | |
|                 attvalue += len;
 | |
|                 atts[nbatts++] = attvalue;
 | |
|             } else {
 | |
|                 /*
 | |
|                  * attvalue points into the input buffer which can be
 | |
|                  * reallocated. Store differences to input->base instead.
 | |
|                  * The pointers will be reconstructed later.
 | |
|                  */
 | |
|                 atts[nbatts++] = (void *) (attvalue - BASE_PTR);
 | |
|                 attvalue += len;
 | |
|                 atts[nbatts++] = (void *) (attvalue - BASE_PTR);
 | |
|             }
 | |
|             /*
 | |
|              * tag if some deallocation is needed
 | |
|              */
 | |
|             if (alloc != 0) attval = 1;
 | |
|             attvalue = NULL; /* moved into atts */
 | |
|         }
 | |
| 
 | |
| next_attr:
 | |
|         if ((attvalue != NULL) && (alloc != 0)) {
 | |
|             xmlFree(attvalue);
 | |
|             attvalue = NULL;
 | |
|         }
 | |
| 
 | |
| 	GROW
 | |
|         if (ctxt->instate == XML_PARSER_EOF)
 | |
|             break;
 | |
| 	if ((RAW == '>') || (((RAW == '/') && (NXT(1) == '>'))))
 | |
| 	    break;
 | |
| 	if (SKIP_BLANKS == 0) {
 | |
| 	    xmlFatalErrMsg(ctxt, XML_ERR_SPACE_REQUIRED,
 | |
| 			   "attributes construct error\n");
 | |
| 	    break;
 | |
| 	}
 | |
|         GROW;
 | |
|     }
 | |
| 
 | |
|     if (ctxt->input->id != inputid) {
 | |
|         xmlFatalErr(ctxt, XML_ERR_INTERNAL_ERROR,
 | |
|                     "Unexpected change of input\n");
 | |
|         localname = NULL;
 | |
|         goto done;
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * Namespaces from default attributes
 | |
|      */
 | |
|     if (ctxt->attsDefault != NULL) {
 | |
|         xmlDefAttrsPtr defaults;
 | |
| 
 | |
| 	defaults = xmlHashLookup2(ctxt->attsDefault, localname, prefix);
 | |
| 	if (defaults != NULL) {
 | |
| 	    for (i = 0; i < defaults->nbAttrs; i++) {
 | |
|                 xmlDefAttr *attr = &defaults->attrs[i];
 | |
| 
 | |
| 	        attname = attr->name.name;
 | |
| 		aprefix = attr->prefix.name;
 | |
| 
 | |
| 		if ((attname == ctxt->str_xmlns) && (aprefix == NULL)) {
 | |
|                     xmlParserEntityCheck(ctxt, attr->expandedSize);
 | |
| 
 | |
|                     if (xmlParserNsPush(ctxt, NULL, &attr->value, NULL, 1) > 0)
 | |
|                         nbNs++;
 | |
| 		} else if (aprefix == ctxt->str_xmlns) {
 | |
|                     xmlParserEntityCheck(ctxt, attr->expandedSize);
 | |
| 
 | |
|                     if (xmlParserNsPush(ctxt, &attr->name, &attr->value,
 | |
|                                       NULL, 1) > 0)
 | |
|                         nbNs++;
 | |
| 		}
 | |
| 	    }
 | |
| 	}
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * Resolve attribute namespaces
 | |
|      */
 | |
|     for (i = 0; i < nbatts; i += 5) {
 | |
|         attname = atts[i];
 | |
|         aprefix = atts[i+1];
 | |
| 
 | |
|         /*
 | |
| 	* The default namespace does not apply to attribute names.
 | |
| 	*/
 | |
| 	if (aprefix == NULL) {
 | |
|             nsIndex = NS_INDEX_EMPTY;
 | |
|         } else if (aprefix == ctxt->str_xml) {
 | |
|             nsIndex = NS_INDEX_XML;
 | |
|         } else {
 | |
|             haprefix.name = aprefix;
 | |
|             haprefix.hashValue = (size_t) atts[i+2];
 | |
|             nsIndex = xmlParserNsLookup(ctxt, &haprefix, NULL);
 | |
| 	    if (nsIndex == INT_MAX) {
 | |
|                 xmlNsErr(ctxt, XML_NS_ERR_UNDEFINED_NAMESPACE,
 | |
| 		    "Namespace prefix %s for %s on %s is not defined\n",
 | |
| 		    aprefix, attname, localname);
 | |
|                 nsIndex = NS_INDEX_EMPTY;
 | |
|             }
 | |
|         }
 | |
| 
 | |
|         atts[i+2] = (const xmlChar *) (ptrdiff_t) nsIndex;
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * Verify that attribute names are unique.
 | |
|      */
 | |
|     for (i = 0, j = 0; j < nratts; i += 5, j++) {
 | |
|         const xmlChar *nsuri;
 | |
|         unsigned hashValue, nameHashValue, uriHashValue;
 | |
|         int res;
 | |
| 
 | |
|         attname = atts[i];
 | |
|         aprefix = atts[i+1];
 | |
|         nsIndex = (ptrdiff_t) atts[i+2];
 | |
|         /* Hash values always have bit 31 set, see dict.c */
 | |
|         nameHashValue = ctxt->attallocs[j] | 0x80000000;
 | |
| 
 | |
|         if (nsIndex == NS_INDEX_EMPTY) {
 | |
|             nsuri = NULL;
 | |
|             uriHashValue = URI_HASH_EMPTY;
 | |
|         } else if (nsIndex == NS_INDEX_XML) {
 | |
|             nsuri = ctxt->str_xml_ns;
 | |
|             uriHashValue = URI_HASH_XML;
 | |
|         } else {
 | |
|             nsuri = ctxt->nsTab[nsIndex * 2 + 1];
 | |
|             uriHashValue = ctxt->nsdb->extra[nsIndex].uriHashValue;
 | |
|         }
 | |
| 
 | |
|         hashValue = xmlCombineHash(nameHashValue, uriHashValue);
 | |
|         res = xmlAttrHashInsert(ctxt, i, &attrHashSize, attname, nsuri,
 | |
|                                 hashValue);
 | |
|         if (res < 0)
 | |
|             continue;
 | |
| 
 | |
| 	/*
 | |
| 	 * [ WFC: Unique Att Spec ]
 | |
| 	 * No attribute name may appear more than once in the same
 | |
| 	 * start-tag or empty-element tag.
 | |
| 	 * As extended by the Namespace in XML REC.
 | |
| 	 */
 | |
|         if (res < INT_MAX) {
 | |
|             if (aprefix == atts[res+1]) {
 | |
|                 xmlErrAttributeDup(ctxt, aprefix, attname);
 | |
|             } else {
 | |
|                 xmlNsErr(ctxt, XML_NS_ERR_ATTRIBUTE_REDEFINED,
 | |
|                          "Namespaced Attribute %s in '%s' redefined\n",
 | |
|                          attname, nsuri, NULL);
 | |
|             }
 | |
| 	}
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * Default attributes
 | |
|      */
 | |
|     if (ctxt->attsDefault != NULL) {
 | |
|         xmlDefAttrsPtr defaults;
 | |
| 
 | |
| 	defaults = xmlHashLookup2(ctxt->attsDefault, localname, prefix);
 | |
| 	if (defaults != NULL) {
 | |
| 	    for (i = 0; i < defaults->nbAttrs; i++) {
 | |
|                 xmlDefAttr *attr = &defaults->attrs[i];
 | |
|                 const xmlChar *nsuri;
 | |
|                 unsigned hashValue, uriHashValue;
 | |
|                 int res;
 | |
| 
 | |
| 	        attname = attr->name.name;
 | |
| 		aprefix = attr->prefix.name;
 | |
| 
 | |
| 		if ((attname == ctxt->str_xmlns) && (aprefix == NULL))
 | |
|                     continue;
 | |
| 		if (aprefix == ctxt->str_xmlns)
 | |
|                     continue;
 | |
| 
 | |
|                 if (aprefix == NULL) {
 | |
|                     nsIndex = NS_INDEX_EMPTY;
 | |
|                     nsuri = NULL;
 | |
|                     uriHashValue = URI_HASH_EMPTY;
 | |
|                 } if (aprefix == ctxt->str_xml) {
 | |
|                     nsIndex = NS_INDEX_XML;
 | |
|                     nsuri = ctxt->str_xml_ns;
 | |
|                     uriHashValue = URI_HASH_XML;
 | |
|                 } else if (aprefix != NULL) {
 | |
|                     nsIndex = xmlParserNsLookup(ctxt, &attr->prefix, NULL);
 | |
|                     if (nsIndex == INT_MAX) {
 | |
|                         xmlNsErr(ctxt, XML_NS_ERR_UNDEFINED_NAMESPACE,
 | |
|                                  "Namespace prefix %s for %s on %s is not "
 | |
|                                  "defined\n",
 | |
|                                  aprefix, attname, localname);
 | |
|                         nsIndex = NS_INDEX_EMPTY;
 | |
|                         nsuri = NULL;
 | |
|                         uriHashValue = URI_HASH_EMPTY;
 | |
|                     } else {
 | |
|                         nsuri = ctxt->nsTab[nsIndex * 2 + 1];
 | |
|                         uriHashValue = ctxt->nsdb->extra[nsIndex].uriHashValue;
 | |
|                     }
 | |
|                 }
 | |
| 
 | |
|                 /*
 | |
|                  * Check whether the attribute exists
 | |
|                  */
 | |
|                 hashValue = xmlCombineHash(attr->name.hashValue, uriHashValue);
 | |
|                 res = xmlAttrHashInsert(ctxt, nbatts, &attrHashSize, attname,
 | |
|                                         nsuri, hashValue);
 | |
|                 if (res < 0)
 | |
|                     continue;
 | |
|                 if (res < INT_MAX) {
 | |
|                     if (aprefix == atts[res+1])
 | |
|                         continue;
 | |
|                     xmlNsErr(ctxt, XML_NS_ERR_ATTRIBUTE_REDEFINED,
 | |
|                              "Namespaced Attribute %s in '%s' redefined\n",
 | |
|                              attname, nsuri, NULL);
 | |
|                 }
 | |
| 
 | |
|                 xmlParserEntityCheck(ctxt, attr->expandedSize);
 | |
| 
 | |
|                 if ((atts == NULL) || (nbatts + 5 > maxatts)) {
 | |
|                     if (xmlCtxtGrowAttrs(ctxt, nbatts + 5) < 0) {
 | |
|                         localname = NULL;
 | |
|                         goto done;
 | |
|                     }
 | |
|                     maxatts = ctxt->maxatts;
 | |
|                     atts = ctxt->atts;
 | |
|                 }
 | |
| 
 | |
|                 atts[nbatts++] = attname;
 | |
|                 atts[nbatts++] = aprefix;
 | |
|                 atts[nbatts++] = (const xmlChar *) (ptrdiff_t) nsIndex;
 | |
|                 atts[nbatts++] = attr->value.name;
 | |
|                 atts[nbatts++] = attr->valueEnd;
 | |
|                 if ((ctxt->standalone == 1) && (attr->external != 0)) {
 | |
|                     xmlValidityError(ctxt, XML_DTD_STANDALONE_DEFAULTED,
 | |
|                             "standalone: attribute %s on %s defaulted "
 | |
|                             "from external subset\n",
 | |
|                             attname, localname);
 | |
|                 }
 | |
|                 nbdef++;
 | |
| 	    }
 | |
| 	}
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * Reconstruct attribute pointers
 | |
|      */
 | |
|     for (i = 0, j = 0; i < nbatts; i += 5, j++) {
 | |
|         /* namespace URI */
 | |
|         nsIndex = (ptrdiff_t) atts[i+2];
 | |
|         if (nsIndex == INT_MAX)
 | |
|             atts[i+2] = NULL;
 | |
|         else if (nsIndex == INT_MAX - 1)
 | |
|             atts[i+2] = ctxt->str_xml_ns;
 | |
|         else
 | |
|             atts[i+2] = ctxt->nsTab[nsIndex * 2 + 1];
 | |
| 
 | |
|         if ((j < nratts) && (ctxt->attallocs[j] & 0x80000000) == 0) {
 | |
|             atts[i+3] = BASE_PTR + (ptrdiff_t) atts[i+3];  /* value */
 | |
|             atts[i+4] = BASE_PTR + (ptrdiff_t) atts[i+4];  /* valuend */
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     uri = xmlParserNsLookupUri(ctxt, &hprefix);
 | |
|     if ((prefix != NULL) && (uri == NULL)) {
 | |
| 	xmlNsErr(ctxt, XML_NS_ERR_UNDEFINED_NAMESPACE,
 | |
| 	         "Namespace prefix %s on %s is not defined\n",
 | |
| 		 prefix, localname, NULL);
 | |
|     }
 | |
|     *pref = prefix;
 | |
|     *URI = uri;
 | |
| 
 | |
|     /*
 | |
|      * SAX callback
 | |
|      */
 | |
|     if ((ctxt->sax != NULL) && (ctxt->sax->startElementNs != NULL) &&
 | |
| 	(!ctxt->disableSAX)) {
 | |
| 	if (nbNs > 0)
 | |
| 	    ctxt->sax->startElementNs(ctxt->userData, localname, prefix, uri,
 | |
|                           nbNs, ctxt->nsTab + 2 * (ctxt->nsNr - nbNs),
 | |
| 			  nbatts / 5, nbdef, atts);
 | |
| 	else
 | |
| 	    ctxt->sax->startElementNs(ctxt->userData, localname, prefix, uri,
 | |
|                           0, NULL, nbatts / 5, nbdef, atts);
 | |
|     }
 | |
| 
 | |
| done:
 | |
|     /*
 | |
|      * Free allocated attribute values
 | |
|      */
 | |
|     if (attval != 0) {
 | |
| 	for (i = 0, j = 0; j < nratts; i += 5, j++)
 | |
| 	    if (ctxt->attallocs[j] & 0x80000000)
 | |
| 	        xmlFree((xmlChar *) atts[i+3]);
 | |
|     }
 | |
| 
 | |
|     *nbNsPtr = nbNs;
 | |
|     return(localname);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseEndTag2:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @line:  line of the start tag
 | |
|  * @nsNr:  number of namespaces on the start tag
 | |
|  *
 | |
|  * Parse an end tag. Always consumes '</'.
 | |
|  *
 | |
|  * [42] ETag ::= '</' Name S? '>'
 | |
|  *
 | |
|  * With namespace
 | |
|  *
 | |
|  * [NS 9] ETag ::= '</' QName S? '>'
 | |
|  */
 | |
| 
 | |
| static void
 | |
| xmlParseEndTag2(xmlParserCtxtPtr ctxt, const xmlStartTag *tag) {
 | |
|     const xmlChar *name;
 | |
| 
 | |
|     GROW;
 | |
|     if ((RAW != '<') || (NXT(1) != '/')) {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_LTSLASH_REQUIRED, NULL);
 | |
| 	return;
 | |
|     }
 | |
|     SKIP(2);
 | |
| 
 | |
|     if (tag->prefix == NULL)
 | |
|         name = xmlParseNameAndCompare(ctxt, ctxt->name);
 | |
|     else
 | |
|         name = xmlParseQNameAndCompare(ctxt, ctxt->name, tag->prefix);
 | |
| 
 | |
|     /*
 | |
|      * We should definitely be at the ending "S? '>'" part
 | |
|      */
 | |
|     GROW;
 | |
|     if (ctxt->instate == XML_PARSER_EOF)
 | |
|         return;
 | |
|     SKIP_BLANKS;
 | |
|     if ((!IS_BYTE_CHAR(RAW)) || (RAW != '>')) {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_GT_REQUIRED, NULL);
 | |
|     } else
 | |
| 	NEXT1;
 | |
| 
 | |
|     /*
 | |
|      * [ WFC: Element Type Match ]
 | |
|      * The Name in an element's end-tag must match the element type in the
 | |
|      * start-tag.
 | |
|      *
 | |
|      */
 | |
|     if (name != (xmlChar*)1) {
 | |
|         if (name == NULL) name = BAD_CAST "unparsable";
 | |
|         xmlFatalErrMsgStrIntStr(ctxt, XML_ERR_TAG_NAME_MISMATCH,
 | |
| 		     "Opening and ending tag mismatch: %s line %d and %s\n",
 | |
| 		                ctxt->name, tag->line, name);
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * SAX: End of Tag
 | |
|      */
 | |
|     if ((ctxt->sax != NULL) && (ctxt->sax->endElementNs != NULL) &&
 | |
| 	(!ctxt->disableSAX))
 | |
| 	ctxt->sax->endElementNs(ctxt->userData, ctxt->name, tag->prefix,
 | |
|                                 tag->URI);
 | |
| 
 | |
|     spacePop(ctxt);
 | |
|     if (tag->nsNr != 0)
 | |
| 	xmlParserNsPop(ctxt, tag->nsNr);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseCDSect:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * Parse escaped pure raw content. Always consumes '<!['.
 | |
|  *
 | |
|  * [18] CDSect ::= CDStart CData CDEnd
 | |
|  *
 | |
|  * [19] CDStart ::= '<![CDATA['
 | |
|  *
 | |
|  * [20] Data ::= (Char* - (Char* ']]>' Char*))
 | |
|  *
 | |
|  * [21] CDEnd ::= ']]>'
 | |
|  */
 | |
| void
 | |
| xmlParseCDSect(xmlParserCtxtPtr ctxt) {
 | |
|     xmlChar *buf = NULL;
 | |
|     int len = 0;
 | |
|     int size = XML_PARSER_BUFFER_SIZE;
 | |
|     int r, rl;
 | |
|     int	s, sl;
 | |
|     int cur, l;
 | |
|     int maxLength = (ctxt->options & XML_PARSE_HUGE) ?
 | |
|                     XML_MAX_HUGE_LENGTH :
 | |
|                     XML_MAX_TEXT_LENGTH;
 | |
| 
 | |
|     if ((CUR != '<') || (NXT(1) != '!') || (NXT(2) != '['))
 | |
|         return;
 | |
|     SKIP(3);
 | |
| 
 | |
|     if (!CMP6(CUR_PTR, 'C', 'D', 'A', 'T', 'A', '['))
 | |
|         return;
 | |
|     SKIP(6);
 | |
| 
 | |
|     ctxt->instate = XML_PARSER_CDATA_SECTION;
 | |
|     r = CUR_CHAR(rl);
 | |
|     if (!IS_CHAR(r)) {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_CDATA_NOT_FINISHED, NULL);
 | |
|         goto out;
 | |
|     }
 | |
|     NEXTL(rl);
 | |
|     s = CUR_CHAR(sl);
 | |
|     if (!IS_CHAR(s)) {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_CDATA_NOT_FINISHED, NULL);
 | |
|         goto out;
 | |
|     }
 | |
|     NEXTL(sl);
 | |
|     cur = CUR_CHAR(l);
 | |
|     buf = (xmlChar *) xmlMallocAtomic(size);
 | |
|     if (buf == NULL) {
 | |
| 	xmlErrMemory(ctxt, NULL);
 | |
|         goto out;
 | |
|     }
 | |
|     while (IS_CHAR(cur) &&
 | |
|            ((r != ']') || (s != ']') || (cur != '>'))) {
 | |
| 	if (len + 5 >= size) {
 | |
| 	    xmlChar *tmp;
 | |
| 
 | |
| 	    tmp = (xmlChar *) xmlRealloc(buf, size * 2);
 | |
| 	    if (tmp == NULL) {
 | |
| 		xmlErrMemory(ctxt, NULL);
 | |
|                 goto out;
 | |
| 	    }
 | |
| 	    buf = tmp;
 | |
| 	    size *= 2;
 | |
| 	}
 | |
| 	COPY_BUF(buf, len, r);
 | |
|         if (len > maxLength) {
 | |
|             xmlFatalErrMsg(ctxt, XML_ERR_CDATA_NOT_FINISHED,
 | |
|                            "CData section too big found\n");
 | |
|             goto out;
 | |
|         }
 | |
| 	r = s;
 | |
| 	rl = sl;
 | |
| 	s = cur;
 | |
| 	sl = l;
 | |
| 	NEXTL(l);
 | |
| 	cur = CUR_CHAR(l);
 | |
|     }
 | |
|     buf[len] = 0;
 | |
|     if (ctxt->instate == XML_PARSER_EOF) {
 | |
|         xmlFree(buf);
 | |
|         return;
 | |
|     }
 | |
|     if (cur != '>') {
 | |
| 	xmlFatalErrMsgStr(ctxt, XML_ERR_CDATA_NOT_FINISHED,
 | |
| 	                     "CData section not finished\n%.50s\n", buf);
 | |
|         goto out;
 | |
|     }
 | |
|     NEXTL(l);
 | |
| 
 | |
|     /*
 | |
|      * OK the buffer is to be consumed as cdata.
 | |
|      */
 | |
|     if ((ctxt->sax != NULL) && (!ctxt->disableSAX)) {
 | |
| 	if (ctxt->sax->cdataBlock != NULL)
 | |
| 	    ctxt->sax->cdataBlock(ctxt->userData, buf, len);
 | |
| 	else if (ctxt->sax->characters != NULL)
 | |
| 	    ctxt->sax->characters(ctxt->userData, buf, len);
 | |
|     }
 | |
| 
 | |
| out:
 | |
|     if (ctxt->instate != XML_PARSER_EOF)
 | |
|         ctxt->instate = XML_PARSER_CONTENT;
 | |
|     xmlFree(buf);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseContentInternal:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * Parse a content sequence. Stops at EOF or '</'. Leaves checking of
 | |
|  * unexpected EOF to the caller.
 | |
|  */
 | |
| 
 | |
| static void
 | |
| xmlParseContentInternal(xmlParserCtxtPtr ctxt) {
 | |
|     int nameNr = ctxt->nameNr;
 | |
| 
 | |
|     GROW;
 | |
|     while ((ctxt->input->cur < ctxt->input->end) &&
 | |
| 	   (ctxt->instate != XML_PARSER_EOF)) {
 | |
| 	const xmlChar *cur = ctxt->input->cur;
 | |
| 
 | |
| 	/*
 | |
| 	 * First case : a Processing Instruction.
 | |
| 	 */
 | |
| 	if ((*cur == '<') && (cur[1] == '?')) {
 | |
| 	    xmlParsePI(ctxt);
 | |
| 	}
 | |
| 
 | |
| 	/*
 | |
| 	 * Second case : a CDSection
 | |
| 	 */
 | |
| 	/* 2.6.0 test was *cur not RAW */
 | |
| 	else if (CMP9(CUR_PTR, '<', '!', '[', 'C', 'D', 'A', 'T', 'A', '[')) {
 | |
| 	    xmlParseCDSect(ctxt);
 | |
| 	}
 | |
| 
 | |
| 	/*
 | |
| 	 * Third case :  a comment
 | |
| 	 */
 | |
| 	else if ((*cur == '<') && (NXT(1) == '!') &&
 | |
| 		 (NXT(2) == '-') && (NXT(3) == '-')) {
 | |
| 	    xmlParseComment(ctxt);
 | |
| 	    ctxt->instate = XML_PARSER_CONTENT;
 | |
| 	}
 | |
| 
 | |
| 	/*
 | |
| 	 * Fourth case :  a sub-element.
 | |
| 	 */
 | |
| 	else if (*cur == '<') {
 | |
|             if (NXT(1) == '/') {
 | |
|                 if (ctxt->nameNr <= nameNr)
 | |
|                     break;
 | |
| 	        xmlParseElementEnd(ctxt);
 | |
|             } else {
 | |
| 	        xmlParseElementStart(ctxt);
 | |
|             }
 | |
| 	}
 | |
| 
 | |
| 	/*
 | |
| 	 * Fifth case : a reference. If if has not been resolved,
 | |
| 	 *    parsing returns it's Name, create the node
 | |
| 	 */
 | |
| 
 | |
| 	else if (*cur == '&') {
 | |
| 	    xmlParseReference(ctxt);
 | |
| 	}
 | |
| 
 | |
| 	/*
 | |
| 	 * Last case, text. Note that References are handled directly.
 | |
| 	 */
 | |
| 	else {
 | |
| 	    xmlParseCharDataInternal(ctxt, 0);
 | |
| 	}
 | |
| 
 | |
| 	SHRINK;
 | |
| 	GROW;
 | |
|     }
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseContent:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * Parse a content sequence. Stops at EOF or '</'.
 | |
|  *
 | |
|  * [43] content ::= (element | CharData | Reference | CDSect | PI | Comment)*
 | |
|  */
 | |
| 
 | |
| void
 | |
| xmlParseContent(xmlParserCtxtPtr ctxt) {
 | |
|     int nameNr = ctxt->nameNr;
 | |
| 
 | |
|     xmlParseContentInternal(ctxt);
 | |
| 
 | |
|     if ((ctxt->instate != XML_PARSER_EOF) &&
 | |
|         (ctxt->errNo == XML_ERR_OK) &&
 | |
|         (ctxt->nameNr > nameNr)) {
 | |
|         const xmlChar *name = ctxt->nameTab[ctxt->nameNr - 1];
 | |
|         int line = ctxt->pushTab[ctxt->nameNr - 1].line;
 | |
|         xmlFatalErrMsgStrIntStr(ctxt, XML_ERR_TAG_NOT_FINISHED,
 | |
|                 "Premature end of data in tag %s line %d\n",
 | |
| 		name, line, NULL);
 | |
|     }
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseElement:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * parse an XML element
 | |
|  *
 | |
|  * [39] element ::= EmptyElemTag | STag content ETag
 | |
|  *
 | |
|  * [ WFC: Element Type Match ]
 | |
|  * The Name in an element's end-tag must match the element type in the
 | |
|  * start-tag.
 | |
|  *
 | |
|  */
 | |
| 
 | |
| void
 | |
| xmlParseElement(xmlParserCtxtPtr ctxt) {
 | |
|     if (xmlParseElementStart(ctxt) != 0)
 | |
|         return;
 | |
| 
 | |
|     xmlParseContentInternal(ctxt);
 | |
|     if (ctxt->instate == XML_PARSER_EOF)
 | |
| 	return;
 | |
| 
 | |
|     if (ctxt->input->cur >= ctxt->input->end) {
 | |
|         if (ctxt->errNo == XML_ERR_OK) {
 | |
|             const xmlChar *name = ctxt->nameTab[ctxt->nameNr - 1];
 | |
|             int line = ctxt->pushTab[ctxt->nameNr - 1].line;
 | |
|             xmlFatalErrMsgStrIntStr(ctxt, XML_ERR_TAG_NOT_FINISHED,
 | |
|                     "Premature end of data in tag %s line %d\n",
 | |
|                     name, line, NULL);
 | |
|         }
 | |
|         return;
 | |
|     }
 | |
| 
 | |
|     xmlParseElementEnd(ctxt);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseElementStart:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * Parse the start of an XML element. Returns -1 in case of error, 0 if an
 | |
|  * opening tag was parsed, 1 if an empty element was parsed.
 | |
|  *
 | |
|  * Always consumes '<'.
 | |
|  */
 | |
| static int
 | |
| xmlParseElementStart(xmlParserCtxtPtr ctxt) {
 | |
|     const xmlChar *name;
 | |
|     const xmlChar *prefix = NULL;
 | |
|     const xmlChar *URI = NULL;
 | |
|     xmlParserNodeInfo node_info;
 | |
|     int line;
 | |
|     xmlNodePtr cur;
 | |
|     int nbNs = 0;
 | |
| 
 | |
|     if (((unsigned int) ctxt->nameNr > xmlParserMaxDepth) &&
 | |
|         ((ctxt->options & XML_PARSE_HUGE) == 0)) {
 | |
| 	xmlFatalErrMsgInt(ctxt, XML_ERR_INTERNAL_ERROR,
 | |
| 		 "Excessive depth in document: %d use XML_PARSE_HUGE option\n",
 | |
| 			  xmlParserMaxDepth);
 | |
| 	xmlHaltParser(ctxt);
 | |
| 	return(-1);
 | |
|     }
 | |
| 
 | |
|     /* Capture start position */
 | |
|     if (ctxt->record_info) {
 | |
|         node_info.begin_pos = ctxt->input->consumed +
 | |
|                           (CUR_PTR - ctxt->input->base);
 | |
| 	node_info.begin_line = ctxt->input->line;
 | |
|     }
 | |
| 
 | |
|     if (ctxt->spaceNr == 0)
 | |
| 	spacePush(ctxt, -1);
 | |
|     else if (*ctxt->space == -2)
 | |
| 	spacePush(ctxt, -1);
 | |
|     else
 | |
| 	spacePush(ctxt, *ctxt->space);
 | |
| 
 | |
|     line = ctxt->input->line;
 | |
| #ifdef LIBXML_SAX1_ENABLED
 | |
|     if (ctxt->sax2)
 | |
| #endif /* LIBXML_SAX1_ENABLED */
 | |
|         name = xmlParseStartTag2(ctxt, &prefix, &URI, &nbNs);
 | |
| #ifdef LIBXML_SAX1_ENABLED
 | |
|     else
 | |
| 	name = xmlParseStartTag(ctxt);
 | |
| #endif /* LIBXML_SAX1_ENABLED */
 | |
|     if (ctxt->instate == XML_PARSER_EOF)
 | |
| 	return(-1);
 | |
|     if (name == NULL) {
 | |
| 	spacePop(ctxt);
 | |
|         return(-1);
 | |
|     }
 | |
|     nameNsPush(ctxt, name, prefix, URI, line, nbNs);
 | |
|     cur = ctxt->node;
 | |
| 
 | |
| #ifdef LIBXML_VALID_ENABLED
 | |
|     /*
 | |
|      * [ VC: Root Element Type ]
 | |
|      * The Name in the document type declaration must match the element
 | |
|      * type of the root element.
 | |
|      */
 | |
|     if (ctxt->validate && ctxt->wellFormed && ctxt->myDoc &&
 | |
|         ctxt->node && (ctxt->node == ctxt->myDoc->children))
 | |
|         ctxt->valid &= xmlValidateRoot(&ctxt->vctxt, ctxt->myDoc);
 | |
| #endif /* LIBXML_VALID_ENABLED */
 | |
| 
 | |
|     /*
 | |
|      * Check for an Empty Element.
 | |
|      */
 | |
|     if ((RAW == '/') && (NXT(1) == '>')) {
 | |
|         SKIP(2);
 | |
| 	if (ctxt->sax2) {
 | |
| 	    if ((ctxt->sax != NULL) && (ctxt->sax->endElementNs != NULL) &&
 | |
| 		(!ctxt->disableSAX))
 | |
| 		ctxt->sax->endElementNs(ctxt->userData, name, prefix, URI);
 | |
| #ifdef LIBXML_SAX1_ENABLED
 | |
| 	} else {
 | |
| 	    if ((ctxt->sax != NULL) && (ctxt->sax->endElement != NULL) &&
 | |
| 		(!ctxt->disableSAX))
 | |
| 		ctxt->sax->endElement(ctxt->userData, name);
 | |
| #endif /* LIBXML_SAX1_ENABLED */
 | |
| 	}
 | |
| 	namePop(ctxt);
 | |
| 	spacePop(ctxt);
 | |
| 	if (nbNs > 0)
 | |
| 	    xmlParserNsPop(ctxt, nbNs);
 | |
| 	if (cur != NULL && ctxt->record_info) {
 | |
|             node_info.node = cur;
 | |
|             node_info.end_pos = ctxt->input->consumed +
 | |
|                                 (CUR_PTR - ctxt->input->base);
 | |
|             node_info.end_line = ctxt->input->line;
 | |
|             xmlParserAddNodeInfo(ctxt, &node_info);
 | |
| 	}
 | |
| 	return(1);
 | |
|     }
 | |
|     if (RAW == '>') {
 | |
|         NEXT1;
 | |
|         if (cur != NULL && ctxt->record_info) {
 | |
|             node_info.node = cur;
 | |
|             node_info.end_pos = 0;
 | |
|             node_info.end_line = 0;
 | |
|             xmlParserAddNodeInfo(ctxt, &node_info);
 | |
|         }
 | |
|     } else {
 | |
|         xmlFatalErrMsgStrIntStr(ctxt, XML_ERR_GT_REQUIRED,
 | |
| 		     "Couldn't find end of Start Tag %s line %d\n",
 | |
| 		                name, line, NULL);
 | |
| 
 | |
| 	/*
 | |
| 	 * end of parsing of this node.
 | |
| 	 */
 | |
| 	nodePop(ctxt);
 | |
| 	namePop(ctxt);
 | |
| 	spacePop(ctxt);
 | |
| 	if (nbNs > 0)
 | |
| 	    xmlParserNsPop(ctxt, nbNs);
 | |
| 	return(-1);
 | |
|     }
 | |
| 
 | |
|     return(0);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseElementEnd:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * Parse the end of an XML element. Always consumes '</'.
 | |
|  */
 | |
| static void
 | |
| xmlParseElementEnd(xmlParserCtxtPtr ctxt) {
 | |
|     xmlNodePtr cur = ctxt->node;
 | |
| 
 | |
|     if (ctxt->nameNr <= 0) {
 | |
|         if ((RAW == '<') && (NXT(1) == '/'))
 | |
|             SKIP(2);
 | |
|         return;
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * parse the end of tag: '</' should be here.
 | |
|      */
 | |
|     if (ctxt->sax2) {
 | |
| 	xmlParseEndTag2(ctxt, &ctxt->pushTab[ctxt->nameNr - 1]);
 | |
| 	namePop(ctxt);
 | |
|     }
 | |
| #ifdef LIBXML_SAX1_ENABLED
 | |
|     else
 | |
| 	xmlParseEndTag1(ctxt, 0);
 | |
| #endif /* LIBXML_SAX1_ENABLED */
 | |
| 
 | |
|     /*
 | |
|      * Capture end position
 | |
|      */
 | |
|     if (cur != NULL && ctxt->record_info) {
 | |
|         xmlParserNodeInfoPtr node_info;
 | |
| 
 | |
|         node_info = (xmlParserNodeInfoPtr) xmlParserFindNodeInfo(ctxt, cur);
 | |
|         if (node_info != NULL) {
 | |
|             node_info->end_pos = ctxt->input->consumed +
 | |
|                                  (CUR_PTR - ctxt->input->base);
 | |
|             node_info->end_line = ctxt->input->line;
 | |
|         }
 | |
|     }
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseVersionNum:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * parse the XML version value.
 | |
|  *
 | |
|  * [26] VersionNum ::= '1.' [0-9]+
 | |
|  *
 | |
|  * In practice allow [0-9].[0-9]+ at that level
 | |
|  *
 | |
|  * Returns the string giving the XML version number, or NULL
 | |
|  */
 | |
| xmlChar *
 | |
| xmlParseVersionNum(xmlParserCtxtPtr ctxt) {
 | |
|     xmlChar *buf = NULL;
 | |
|     int len = 0;
 | |
|     int size = 10;
 | |
|     xmlChar cur;
 | |
| 
 | |
|     buf = (xmlChar *) xmlMallocAtomic(size);
 | |
|     if (buf == NULL) {
 | |
| 	xmlErrMemory(ctxt, NULL);
 | |
| 	return(NULL);
 | |
|     }
 | |
|     cur = CUR;
 | |
|     if (!((cur >= '0') && (cur <= '9'))) {
 | |
| 	xmlFree(buf);
 | |
| 	return(NULL);
 | |
|     }
 | |
|     buf[len++] = cur;
 | |
|     NEXT;
 | |
|     cur=CUR;
 | |
|     if (cur != '.') {
 | |
| 	xmlFree(buf);
 | |
| 	return(NULL);
 | |
|     }
 | |
|     buf[len++] = cur;
 | |
|     NEXT;
 | |
|     cur=CUR;
 | |
|     while ((cur >= '0') && (cur <= '9')) {
 | |
| 	if (len + 1 >= size) {
 | |
| 	    xmlChar *tmp;
 | |
| 
 | |
| 	    size *= 2;
 | |
| 	    tmp = (xmlChar *) xmlRealloc(buf, size);
 | |
| 	    if (tmp == NULL) {
 | |
| 	        xmlFree(buf);
 | |
| 		xmlErrMemory(ctxt, NULL);
 | |
| 		return(NULL);
 | |
| 	    }
 | |
| 	    buf = tmp;
 | |
| 	}
 | |
| 	buf[len++] = cur;
 | |
| 	NEXT;
 | |
| 	cur=CUR;
 | |
|     }
 | |
|     buf[len] = 0;
 | |
|     return(buf);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseVersionInfo:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * parse the XML version.
 | |
|  *
 | |
|  * [24] VersionInfo ::= S 'version' Eq (' VersionNum ' | " VersionNum ")
 | |
|  *
 | |
|  * [25] Eq ::= S? '=' S?
 | |
|  *
 | |
|  * Returns the version string, e.g. "1.0"
 | |
|  */
 | |
| 
 | |
| xmlChar *
 | |
| xmlParseVersionInfo(xmlParserCtxtPtr ctxt) {
 | |
|     xmlChar *version = NULL;
 | |
| 
 | |
|     if (CMP7(CUR_PTR, 'v', 'e', 'r', 's', 'i', 'o', 'n')) {
 | |
| 	SKIP(7);
 | |
| 	SKIP_BLANKS;
 | |
| 	if (RAW != '=') {
 | |
| 	    xmlFatalErr(ctxt, XML_ERR_EQUAL_REQUIRED, NULL);
 | |
| 	    return(NULL);
 | |
|         }
 | |
| 	NEXT;
 | |
| 	SKIP_BLANKS;
 | |
| 	if (RAW == '"') {
 | |
| 	    NEXT;
 | |
| 	    version = xmlParseVersionNum(ctxt);
 | |
| 	    if (RAW != '"') {
 | |
| 		xmlFatalErr(ctxt, XML_ERR_STRING_NOT_CLOSED, NULL);
 | |
| 	    } else
 | |
| 	        NEXT;
 | |
| 	} else if (RAW == '\''){
 | |
| 	    NEXT;
 | |
| 	    version = xmlParseVersionNum(ctxt);
 | |
| 	    if (RAW != '\'') {
 | |
| 		xmlFatalErr(ctxt, XML_ERR_STRING_NOT_CLOSED, NULL);
 | |
| 	    } else
 | |
| 	        NEXT;
 | |
| 	} else {
 | |
| 	    xmlFatalErr(ctxt, XML_ERR_STRING_NOT_STARTED, NULL);
 | |
| 	}
 | |
|     }
 | |
|     return(version);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseEncName:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * parse the XML encoding name
 | |
|  *
 | |
|  * [81] EncName ::= [A-Za-z] ([A-Za-z0-9._] | '-')*
 | |
|  *
 | |
|  * Returns the encoding name value or NULL
 | |
|  */
 | |
| xmlChar *
 | |
| xmlParseEncName(xmlParserCtxtPtr ctxt) {
 | |
|     xmlChar *buf = NULL;
 | |
|     int len = 0;
 | |
|     int size = 10;
 | |
|     int maxLength = (ctxt->options & XML_PARSE_HUGE) ?
 | |
|                     XML_MAX_TEXT_LENGTH :
 | |
|                     XML_MAX_NAME_LENGTH;
 | |
|     xmlChar cur;
 | |
| 
 | |
|     cur = CUR;
 | |
|     if (((cur >= 'a') && (cur <= 'z')) ||
 | |
|         ((cur >= 'A') && (cur <= 'Z'))) {
 | |
| 	buf = (xmlChar *) xmlMallocAtomic(size);
 | |
| 	if (buf == NULL) {
 | |
| 	    xmlErrMemory(ctxt, NULL);
 | |
| 	    return(NULL);
 | |
| 	}
 | |
| 
 | |
| 	buf[len++] = cur;
 | |
| 	NEXT;
 | |
| 	cur = CUR;
 | |
| 	while (((cur >= 'a') && (cur <= 'z')) ||
 | |
| 	       ((cur >= 'A') && (cur <= 'Z')) ||
 | |
| 	       ((cur >= '0') && (cur <= '9')) ||
 | |
| 	       (cur == '.') || (cur == '_') ||
 | |
| 	       (cur == '-')) {
 | |
| 	    if (len + 1 >= size) {
 | |
| 	        xmlChar *tmp;
 | |
| 
 | |
| 		size *= 2;
 | |
| 		tmp = (xmlChar *) xmlRealloc(buf, size);
 | |
| 		if (tmp == NULL) {
 | |
| 		    xmlErrMemory(ctxt, NULL);
 | |
| 		    xmlFree(buf);
 | |
| 		    return(NULL);
 | |
| 		}
 | |
| 		buf = tmp;
 | |
| 	    }
 | |
| 	    buf[len++] = cur;
 | |
|             if (len > maxLength) {
 | |
|                 xmlFatalErr(ctxt, XML_ERR_NAME_TOO_LONG, "EncName");
 | |
|                 xmlFree(buf);
 | |
|                 return(NULL);
 | |
|             }
 | |
| 	    NEXT;
 | |
| 	    cur = CUR;
 | |
|         }
 | |
| 	buf[len] = 0;
 | |
|     } else {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_ENCODING_NAME, NULL);
 | |
|     }
 | |
|     return(buf);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseEncodingDecl:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * parse the XML encoding declaration
 | |
|  *
 | |
|  * [80] EncodingDecl ::= S 'encoding' Eq ('"' EncName '"' |  "'" EncName "'")
 | |
|  *
 | |
|  * this setups the conversion filters.
 | |
|  *
 | |
|  * Returns the encoding value or NULL
 | |
|  */
 | |
| 
 | |
| const xmlChar *
 | |
| xmlParseEncodingDecl(xmlParserCtxtPtr ctxt) {
 | |
|     xmlChar *encoding = NULL;
 | |
| 
 | |
|     SKIP_BLANKS;
 | |
|     if (CMP8(CUR_PTR, 'e', 'n', 'c', 'o', 'd', 'i', 'n', 'g') == 0)
 | |
|         return(NULL);
 | |
| 
 | |
|     SKIP(8);
 | |
|     SKIP_BLANKS;
 | |
|     if (RAW != '=') {
 | |
|         xmlFatalErr(ctxt, XML_ERR_EQUAL_REQUIRED, NULL);
 | |
|         return(NULL);
 | |
|     }
 | |
|     NEXT;
 | |
|     SKIP_BLANKS;
 | |
|     if (RAW == '"') {
 | |
|         NEXT;
 | |
|         encoding = xmlParseEncName(ctxt);
 | |
|         if (RAW != '"') {
 | |
|             xmlFatalErr(ctxt, XML_ERR_STRING_NOT_CLOSED, NULL);
 | |
|             xmlFree((xmlChar *) encoding);
 | |
|             return(NULL);
 | |
|         } else
 | |
|             NEXT;
 | |
|     } else if (RAW == '\''){
 | |
|         NEXT;
 | |
|         encoding = xmlParseEncName(ctxt);
 | |
|         if (RAW != '\'') {
 | |
|             xmlFatalErr(ctxt, XML_ERR_STRING_NOT_CLOSED, NULL);
 | |
|             xmlFree((xmlChar *) encoding);
 | |
|             return(NULL);
 | |
|         } else
 | |
|             NEXT;
 | |
|     } else {
 | |
|         xmlFatalErr(ctxt, XML_ERR_STRING_NOT_STARTED, NULL);
 | |
|     }
 | |
| 
 | |
|     if (encoding == NULL)
 | |
|         return(NULL);
 | |
| 
 | |
|     xmlSetDeclaredEncoding(ctxt, encoding);
 | |
| 
 | |
|     return(ctxt->encoding);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseSDDecl:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * parse the XML standalone declaration
 | |
|  *
 | |
|  * [32] SDDecl ::= S 'standalone' Eq
 | |
|  *                 (("'" ('yes' | 'no') "'") | ('"' ('yes' | 'no')'"'))
 | |
|  *
 | |
|  * [ VC: Standalone Document Declaration ]
 | |
|  * TODO The standalone document declaration must have the value "no"
 | |
|  * if any external markup declarations contain declarations of:
 | |
|  *  - attributes with default values, if elements to which these
 | |
|  *    attributes apply appear in the document without specifications
 | |
|  *    of values for these attributes, or
 | |
|  *  - entities (other than amp, lt, gt, apos, quot), if references
 | |
|  *    to those entities appear in the document, or
 | |
|  *  - attributes with values subject to normalization, where the
 | |
|  *    attribute appears in the document with a value which will change
 | |
|  *    as a result of normalization, or
 | |
|  *  - element types with element content, if white space occurs directly
 | |
|  *    within any instance of those types.
 | |
|  *
 | |
|  * Returns:
 | |
|  *   1 if standalone="yes"
 | |
|  *   0 if standalone="no"
 | |
|  *  -2 if standalone attribute is missing or invalid
 | |
|  *	  (A standalone value of -2 means that the XML declaration was found,
 | |
|  *	   but no value was specified for the standalone attribute).
 | |
|  */
 | |
| 
 | |
| int
 | |
| xmlParseSDDecl(xmlParserCtxtPtr ctxt) {
 | |
|     int standalone = -2;
 | |
| 
 | |
|     SKIP_BLANKS;
 | |
|     if (CMP10(CUR_PTR, 's', 't', 'a', 'n', 'd', 'a', 'l', 'o', 'n', 'e')) {
 | |
| 	SKIP(10);
 | |
|         SKIP_BLANKS;
 | |
| 	if (RAW != '=') {
 | |
| 	    xmlFatalErr(ctxt, XML_ERR_EQUAL_REQUIRED, NULL);
 | |
| 	    return(standalone);
 | |
|         }
 | |
| 	NEXT;
 | |
| 	SKIP_BLANKS;
 | |
|         if (RAW == '\''){
 | |
| 	    NEXT;
 | |
| 	    if ((RAW == 'n') && (NXT(1) == 'o')) {
 | |
| 	        standalone = 0;
 | |
|                 SKIP(2);
 | |
| 	    } else if ((RAW == 'y') && (NXT(1) == 'e') &&
 | |
| 	               (NXT(2) == 's')) {
 | |
| 	        standalone = 1;
 | |
| 		SKIP(3);
 | |
|             } else {
 | |
| 		xmlFatalErr(ctxt, XML_ERR_STANDALONE_VALUE, NULL);
 | |
| 	    }
 | |
| 	    if (RAW != '\'') {
 | |
| 		xmlFatalErr(ctxt, XML_ERR_STRING_NOT_CLOSED, NULL);
 | |
| 	    } else
 | |
| 	        NEXT;
 | |
| 	} else if (RAW == '"'){
 | |
| 	    NEXT;
 | |
| 	    if ((RAW == 'n') && (NXT(1) == 'o')) {
 | |
| 	        standalone = 0;
 | |
| 		SKIP(2);
 | |
| 	    } else if ((RAW == 'y') && (NXT(1) == 'e') &&
 | |
| 	               (NXT(2) == 's')) {
 | |
| 	        standalone = 1;
 | |
|                 SKIP(3);
 | |
|             } else {
 | |
| 		xmlFatalErr(ctxt, XML_ERR_STANDALONE_VALUE, NULL);
 | |
| 	    }
 | |
| 	    if (RAW != '"') {
 | |
| 		xmlFatalErr(ctxt, XML_ERR_STRING_NOT_CLOSED, NULL);
 | |
| 	    } else
 | |
| 	        NEXT;
 | |
| 	} else {
 | |
| 	    xmlFatalErr(ctxt, XML_ERR_STRING_NOT_STARTED, NULL);
 | |
|         }
 | |
|     }
 | |
|     return(standalone);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseXMLDecl:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * parse an XML declaration header
 | |
|  *
 | |
|  * [23] XMLDecl ::= '<?xml' VersionInfo EncodingDecl? SDDecl? S? '?>'
 | |
|  */
 | |
| 
 | |
| void
 | |
| xmlParseXMLDecl(xmlParserCtxtPtr ctxt) {
 | |
|     xmlChar *version;
 | |
| 
 | |
|     /*
 | |
|      * This value for standalone indicates that the document has an
 | |
|      * XML declaration but it does not have a standalone attribute.
 | |
|      * It will be overwritten later if a standalone attribute is found.
 | |
|      */
 | |
| 
 | |
|     ctxt->standalone = -2;
 | |
| 
 | |
|     /*
 | |
|      * We know that '<?xml' is here.
 | |
|      */
 | |
|     SKIP(5);
 | |
| 
 | |
|     if (!IS_BLANK_CH(RAW)) {
 | |
| 	xmlFatalErrMsg(ctxt, XML_ERR_SPACE_REQUIRED,
 | |
| 	               "Blank needed after '<?xml'\n");
 | |
|     }
 | |
|     SKIP_BLANKS;
 | |
| 
 | |
|     /*
 | |
|      * We must have the VersionInfo here.
 | |
|      */
 | |
|     version = xmlParseVersionInfo(ctxt);
 | |
|     if (version == NULL) {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_VERSION_MISSING, NULL);
 | |
|     } else {
 | |
| 	if (!xmlStrEqual(version, (const xmlChar *) XML_DEFAULT_VERSION)) {
 | |
| 	    /*
 | |
| 	     * Changed here for XML-1.0 5th edition
 | |
| 	     */
 | |
| 	    if (ctxt->options & XML_PARSE_OLD10) {
 | |
| 		xmlFatalErrMsgStr(ctxt, XML_ERR_UNKNOWN_VERSION,
 | |
| 			          "Unsupported version '%s'\n",
 | |
| 			          version);
 | |
| 	    } else {
 | |
| 	        if ((version[0] == '1') && ((version[1] == '.'))) {
 | |
| 		    xmlWarningMsg(ctxt, XML_WAR_UNKNOWN_VERSION,
 | |
| 		                  "Unsupported version '%s'\n",
 | |
| 				  version, NULL);
 | |
| 		} else {
 | |
| 		    xmlFatalErrMsgStr(ctxt, XML_ERR_UNKNOWN_VERSION,
 | |
| 				      "Unsupported version '%s'\n",
 | |
| 				      version);
 | |
| 		}
 | |
| 	    }
 | |
| 	}
 | |
| 	if (ctxt->version != NULL)
 | |
| 	    xmlFree((void *) ctxt->version);
 | |
| 	ctxt->version = version;
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * We may have the encoding declaration
 | |
|      */
 | |
|     if (!IS_BLANK_CH(RAW)) {
 | |
|         if ((RAW == '?') && (NXT(1) == '>')) {
 | |
| 	    SKIP(2);
 | |
| 	    return;
 | |
| 	}
 | |
| 	xmlFatalErrMsg(ctxt, XML_ERR_SPACE_REQUIRED, "Blank needed here\n");
 | |
|     }
 | |
|     xmlParseEncodingDecl(ctxt);
 | |
|     if ((ctxt->errNo == XML_ERR_UNSUPPORTED_ENCODING) ||
 | |
|          (ctxt->instate == XML_PARSER_EOF)) {
 | |
| 	/*
 | |
| 	 * The XML REC instructs us to stop parsing right here
 | |
| 	 */
 | |
|         return;
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * We may have the standalone status.
 | |
|      */
 | |
|     if ((ctxt->encoding != NULL) && (!IS_BLANK_CH(RAW))) {
 | |
|         if ((RAW == '?') && (NXT(1) == '>')) {
 | |
| 	    SKIP(2);
 | |
| 	    return;
 | |
| 	}
 | |
| 	xmlFatalErrMsg(ctxt, XML_ERR_SPACE_REQUIRED, "Blank needed here\n");
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * We can grow the input buffer freely at that point
 | |
|      */
 | |
|     GROW;
 | |
| 
 | |
|     SKIP_BLANKS;
 | |
|     ctxt->standalone = xmlParseSDDecl(ctxt);
 | |
| 
 | |
|     SKIP_BLANKS;
 | |
|     if ((RAW == '?') && (NXT(1) == '>')) {
 | |
|         SKIP(2);
 | |
|     } else if (RAW == '>') {
 | |
|         /* Deprecated old WD ... */
 | |
| 	xmlFatalErr(ctxt, XML_ERR_XMLDECL_NOT_FINISHED, NULL);
 | |
| 	NEXT;
 | |
|     } else {
 | |
|         int c;
 | |
| 
 | |
| 	xmlFatalErr(ctxt, XML_ERR_XMLDECL_NOT_FINISHED, NULL);
 | |
|         while ((c = CUR) != 0) {
 | |
|             NEXT;
 | |
|             if (c == '>')
 | |
|                 break;
 | |
|         }
 | |
|     }
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseMisc:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * DEPRECATED: Internal function, don't use.
 | |
|  *
 | |
|  * parse an XML Misc* optional field.
 | |
|  *
 | |
|  * [27] Misc ::= Comment | PI |  S
 | |
|  */
 | |
| 
 | |
| void
 | |
| xmlParseMisc(xmlParserCtxtPtr ctxt) {
 | |
|     while (ctxt->instate != XML_PARSER_EOF) {
 | |
|         SKIP_BLANKS;
 | |
|         GROW;
 | |
|         if ((RAW == '<') && (NXT(1) == '?')) {
 | |
| 	    xmlParsePI(ctxt);
 | |
|         } else if (CMP4(CUR_PTR, '<', '!', '-', '-')) {
 | |
| 	    xmlParseComment(ctxt);
 | |
|         } else {
 | |
|             break;
 | |
|         }
 | |
|     }
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseDocument:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * parse an XML document (and build a tree if using the standard SAX
 | |
|  * interface).
 | |
|  *
 | |
|  * [1] document ::= prolog element Misc*
 | |
|  *
 | |
|  * [22] prolog ::= XMLDecl? Misc* (doctypedecl Misc*)?
 | |
|  *
 | |
|  * Returns 0, -1 in case of error. the parser context is augmented
 | |
|  *                as a result of the parsing.
 | |
|  */
 | |
| 
 | |
| int
 | |
| xmlParseDocument(xmlParserCtxtPtr ctxt) {
 | |
|     xmlInitParser();
 | |
| 
 | |
|     if ((ctxt == NULL) || (ctxt->input == NULL))
 | |
|         return(-1);
 | |
| 
 | |
|     GROW;
 | |
| 
 | |
|     /*
 | |
|      * SAX: detecting the level.
 | |
|      */
 | |
|     xmlDetectSAX2(ctxt);
 | |
| 
 | |
|     /*
 | |
|      * SAX: beginning of the document processing.
 | |
|      */
 | |
|     if ((ctxt->sax) && (ctxt->sax->setDocumentLocator))
 | |
|         ctxt->sax->setDocumentLocator(ctxt->userData, &xmlDefaultSAXLocator);
 | |
|     if (ctxt->instate == XML_PARSER_EOF)
 | |
| 	return(-1);
 | |
| 
 | |
|     xmlDetectEncoding(ctxt);
 | |
| 
 | |
|     if (CUR == 0) {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_DOCUMENT_EMPTY, NULL);
 | |
| 	return(-1);
 | |
|     }
 | |
| 
 | |
|     GROW;
 | |
|     if ((CMP5(CUR_PTR, '<', '?', 'x', 'm', 'l')) && (IS_BLANK_CH(NXT(5)))) {
 | |
| 
 | |
| 	/*
 | |
| 	 * Note that we will switch encoding on the fly.
 | |
| 	 */
 | |
| 	xmlParseXMLDecl(ctxt);
 | |
| 	if ((ctxt->errNo == XML_ERR_UNSUPPORTED_ENCODING) ||
 | |
| 	    (ctxt->instate == XML_PARSER_EOF)) {
 | |
| 	    /*
 | |
| 	     * The XML REC instructs us to stop parsing right here
 | |
| 	     */
 | |
| 	    return(-1);
 | |
| 	}
 | |
| 	SKIP_BLANKS;
 | |
|     } else {
 | |
| 	ctxt->version = xmlCharStrdup(XML_DEFAULT_VERSION);
 | |
|     }
 | |
|     if ((ctxt->sax) && (ctxt->sax->startDocument) && (!ctxt->disableSAX))
 | |
|         ctxt->sax->startDocument(ctxt->userData);
 | |
|     if (ctxt->instate == XML_PARSER_EOF)
 | |
| 	return(-1);
 | |
|     if ((ctxt->myDoc != NULL) && (ctxt->input != NULL) &&
 | |
|         (ctxt->input->buf != NULL) && (ctxt->input->buf->compressed >= 0)) {
 | |
| 	ctxt->myDoc->compression = ctxt->input->buf->compressed;
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * The Misc part of the Prolog
 | |
|      */
 | |
|     xmlParseMisc(ctxt);
 | |
| 
 | |
|     /*
 | |
|      * Then possibly doc type declaration(s) and more Misc
 | |
|      * (doctypedecl Misc*)?
 | |
|      */
 | |
|     GROW;
 | |
|     if (CMP9(CUR_PTR, '<', '!', 'D', 'O', 'C', 'T', 'Y', 'P', 'E')) {
 | |
| 
 | |
| 	ctxt->inSubset = 1;
 | |
| 	xmlParseDocTypeDecl(ctxt);
 | |
| 	if (RAW == '[') {
 | |
| 	    ctxt->instate = XML_PARSER_DTD;
 | |
| 	    xmlParseInternalSubset(ctxt);
 | |
| 	    if (ctxt->instate == XML_PARSER_EOF)
 | |
| 		return(-1);
 | |
| 	}
 | |
| 
 | |
| 	/*
 | |
| 	 * Create and update the external subset.
 | |
| 	 */
 | |
| 	ctxt->inSubset = 2;
 | |
| 	if ((ctxt->sax != NULL) && (ctxt->sax->externalSubset != NULL) &&
 | |
| 	    (!ctxt->disableSAX))
 | |
| 	    ctxt->sax->externalSubset(ctxt->userData, ctxt->intSubName,
 | |
| 	                              ctxt->extSubSystem, ctxt->extSubURI);
 | |
| 	if (ctxt->instate == XML_PARSER_EOF)
 | |
| 	    return(-1);
 | |
| 	ctxt->inSubset = 0;
 | |
| 
 | |
|         xmlCleanSpecialAttr(ctxt);
 | |
| 
 | |
| 	ctxt->instate = XML_PARSER_PROLOG;
 | |
| 	xmlParseMisc(ctxt);
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * Time to start parsing the tree itself
 | |
|      */
 | |
|     GROW;
 | |
|     if (RAW != '<') {
 | |
| 	xmlFatalErrMsg(ctxt, XML_ERR_DOCUMENT_EMPTY,
 | |
| 		       "Start tag expected, '<' not found\n");
 | |
|     } else {
 | |
| 	ctxt->instate = XML_PARSER_CONTENT;
 | |
| 	xmlParseElement(ctxt);
 | |
| 	ctxt->instate = XML_PARSER_EPILOG;
 | |
| 
 | |
| 
 | |
| 	/*
 | |
| 	 * The Misc part at the end
 | |
| 	 */
 | |
| 	xmlParseMisc(ctxt);
 | |
| 
 | |
|         if (ctxt->input->cur < ctxt->input->end) {
 | |
|             if (ctxt->errNo == XML_ERR_OK)
 | |
| 	        xmlFatalErr(ctxt, XML_ERR_DOCUMENT_END, NULL);
 | |
|         } else if ((ctxt->input->buf != NULL) &&
 | |
|                    (ctxt->input->buf->encoder != NULL) &&
 | |
|                    (!xmlBufIsEmpty(ctxt->input->buf->raw))) {
 | |
|             xmlFatalErrMsg(ctxt, XML_ERR_INVALID_CHAR,
 | |
|                            "Truncated multi-byte sequence at EOF\n");
 | |
|         }
 | |
| 	ctxt->instate = XML_PARSER_EOF;
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * SAX: end of the document processing.
 | |
|      */
 | |
|     if ((ctxt->sax) && (ctxt->sax->endDocument != NULL))
 | |
|         ctxt->sax->endDocument(ctxt->userData);
 | |
| 
 | |
|     /*
 | |
|      * Remove locally kept entity definitions if the tree was not built
 | |
|      */
 | |
|     if ((ctxt->myDoc != NULL) &&
 | |
| 	(xmlStrEqual(ctxt->myDoc->version, SAX_COMPAT_MODE))) {
 | |
| 	xmlFreeDoc(ctxt->myDoc);
 | |
| 	ctxt->myDoc = NULL;
 | |
|     }
 | |
| 
 | |
|     if ((ctxt->wellFormed) && (ctxt->myDoc != NULL)) {
 | |
|         ctxt->myDoc->properties |= XML_DOC_WELLFORMED;
 | |
| 	if (ctxt->valid)
 | |
| 	    ctxt->myDoc->properties |= XML_DOC_DTDVALID;
 | |
| 	if (ctxt->nsWellFormed)
 | |
| 	    ctxt->myDoc->properties |= XML_DOC_NSVALID;
 | |
| 	if (ctxt->options & XML_PARSE_OLD10)
 | |
| 	    ctxt->myDoc->properties |= XML_DOC_OLD10;
 | |
|     }
 | |
|     if (! ctxt->wellFormed) {
 | |
| 	ctxt->valid = 0;
 | |
| 	return(-1);
 | |
|     }
 | |
|     return(0);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseExtParsedEnt:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * parse a general parsed entity
 | |
|  * An external general parsed entity is well-formed if it matches the
 | |
|  * production labeled extParsedEnt.
 | |
|  *
 | |
|  * [78] extParsedEnt ::= TextDecl? content
 | |
|  *
 | |
|  * Returns 0, -1 in case of error. the parser context is augmented
 | |
|  *                as a result of the parsing.
 | |
|  */
 | |
| 
 | |
| int
 | |
| xmlParseExtParsedEnt(xmlParserCtxtPtr ctxt) {
 | |
|     if ((ctxt == NULL) || (ctxt->input == NULL))
 | |
|         return(-1);
 | |
| 
 | |
|     xmlDetectSAX2(ctxt);
 | |
| 
 | |
|     /*
 | |
|      * SAX: beginning of the document processing.
 | |
|      */
 | |
|     if ((ctxt->sax) && (ctxt->sax->setDocumentLocator))
 | |
|         ctxt->sax->setDocumentLocator(ctxt->userData, &xmlDefaultSAXLocator);
 | |
| 
 | |
|     xmlDetectEncoding(ctxt);
 | |
| 
 | |
|     if (CUR == 0) {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_DOCUMENT_EMPTY, NULL);
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * Check for the XMLDecl in the Prolog.
 | |
|      */
 | |
|     GROW;
 | |
|     if ((CMP5(CUR_PTR, '<', '?', 'x', 'm', 'l')) && (IS_BLANK_CH(NXT(5)))) {
 | |
| 
 | |
| 	/*
 | |
| 	 * Note that we will switch encoding on the fly.
 | |
| 	 */
 | |
| 	xmlParseXMLDecl(ctxt);
 | |
| 	if (ctxt->errNo == XML_ERR_UNSUPPORTED_ENCODING) {
 | |
| 	    /*
 | |
| 	     * The XML REC instructs us to stop parsing right here
 | |
| 	     */
 | |
| 	    return(-1);
 | |
| 	}
 | |
| 	SKIP_BLANKS;
 | |
|     } else {
 | |
| 	ctxt->version = xmlCharStrdup(XML_DEFAULT_VERSION);
 | |
|     }
 | |
|     if ((ctxt->sax) && (ctxt->sax->startDocument) && (!ctxt->disableSAX))
 | |
|         ctxt->sax->startDocument(ctxt->userData);
 | |
|     if (ctxt->instate == XML_PARSER_EOF)
 | |
| 	return(-1);
 | |
| 
 | |
|     /*
 | |
|      * Doing validity checking on chunk doesn't make sense
 | |
|      */
 | |
|     ctxt->instate = XML_PARSER_CONTENT;
 | |
|     ctxt->validate = 0;
 | |
|     ctxt->loadsubset = 0;
 | |
|     ctxt->depth = 0;
 | |
| 
 | |
|     xmlParseContent(ctxt);
 | |
|     if (ctxt->instate == XML_PARSER_EOF)
 | |
| 	return(-1);
 | |
| 
 | |
|     if ((RAW == '<') && (NXT(1) == '/')) {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_NOT_WELL_BALANCED, NULL);
 | |
|     } else if (RAW != 0) {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_EXTRA_CONTENT, NULL);
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * SAX: end of the document processing.
 | |
|      */
 | |
|     if ((ctxt->sax) && (ctxt->sax->endDocument != NULL))
 | |
|         ctxt->sax->endDocument(ctxt->userData);
 | |
| 
 | |
|     if (! ctxt->wellFormed) return(-1);
 | |
|     return(0);
 | |
| }
 | |
| 
 | |
| #ifdef LIBXML_PUSH_ENABLED
 | |
| /************************************************************************
 | |
|  *									*
 | |
|  *		Progressive parsing interfaces				*
 | |
|  *									*
 | |
|  ************************************************************************/
 | |
| 
 | |
| /**
 | |
|  * xmlParseLookupChar:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @c:  character
 | |
|  *
 | |
|  * Check whether the input buffer contains a character.
 | |
|  */
 | |
| static int
 | |
| xmlParseLookupChar(xmlParserCtxtPtr ctxt, int c) {
 | |
|     const xmlChar *cur;
 | |
| 
 | |
|     if (ctxt->checkIndex == 0) {
 | |
|         cur = ctxt->input->cur + 1;
 | |
|     } else {
 | |
|         cur = ctxt->input->cur + ctxt->checkIndex;
 | |
|     }
 | |
| 
 | |
|     if (memchr(cur, c, ctxt->input->end - cur) == NULL) {
 | |
|         size_t index = ctxt->input->end - ctxt->input->cur;
 | |
| 
 | |
|         if (index > LONG_MAX) {
 | |
|             ctxt->checkIndex = 0;
 | |
|             return(1);
 | |
|         }
 | |
|         ctxt->checkIndex = index;
 | |
|         return(0);
 | |
|     } else {
 | |
|         ctxt->checkIndex = 0;
 | |
|         return(1);
 | |
|     }
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseLookupString:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @startDelta: delta to apply at the start
 | |
|  * @str:  string
 | |
|  * @strLen:  length of string
 | |
|  *
 | |
|  * Check whether the input buffer contains a string.
 | |
|  */
 | |
| static const xmlChar *
 | |
| xmlParseLookupString(xmlParserCtxtPtr ctxt, size_t startDelta,
 | |
|                      const char *str, size_t strLen) {
 | |
|     const xmlChar *cur, *term;
 | |
| 
 | |
|     if (ctxt->checkIndex == 0) {
 | |
|         cur = ctxt->input->cur + startDelta;
 | |
|     } else {
 | |
|         cur = ctxt->input->cur + ctxt->checkIndex;
 | |
|     }
 | |
| 
 | |
|     term = BAD_CAST strstr((const char *) cur, str);
 | |
|     if (term == NULL) {
 | |
|         const xmlChar *end = ctxt->input->end;
 | |
|         size_t index;
 | |
| 
 | |
|         /* Rescan (strLen - 1) characters. */
 | |
|         if ((size_t) (end - cur) < strLen)
 | |
|             end = cur;
 | |
|         else
 | |
|             end -= strLen - 1;
 | |
|         index = end - ctxt->input->cur;
 | |
|         if (index > LONG_MAX) {
 | |
|             ctxt->checkIndex = 0;
 | |
|             return(ctxt->input->end - strLen);
 | |
|         }
 | |
|         ctxt->checkIndex = index;
 | |
|     } else {
 | |
|         ctxt->checkIndex = 0;
 | |
|     }
 | |
| 
 | |
|     return(term);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseLookupCharData:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * Check whether the input buffer contains terminated char data.
 | |
|  */
 | |
| static int
 | |
| xmlParseLookupCharData(xmlParserCtxtPtr ctxt) {
 | |
|     const xmlChar *cur = ctxt->input->cur + ctxt->checkIndex;
 | |
|     const xmlChar *end = ctxt->input->end;
 | |
|     size_t index;
 | |
| 
 | |
|     while (cur < end) {
 | |
|         if ((*cur == '<') || (*cur == '&')) {
 | |
|             ctxt->checkIndex = 0;
 | |
|             return(1);
 | |
|         }
 | |
|         cur++;
 | |
|     }
 | |
| 
 | |
|     index = cur - ctxt->input->cur;
 | |
|     if (index > LONG_MAX) {
 | |
|         ctxt->checkIndex = 0;
 | |
|         return(1);
 | |
|     }
 | |
|     ctxt->checkIndex = index;
 | |
|     return(0);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseLookupGt:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * Check whether there's enough data in the input buffer to finish parsing
 | |
|  * a start tag. This has to take quotes into account.
 | |
|  */
 | |
| static int
 | |
| xmlParseLookupGt(xmlParserCtxtPtr ctxt) {
 | |
|     const xmlChar *cur;
 | |
|     const xmlChar *end = ctxt->input->end;
 | |
|     int state = ctxt->endCheckState;
 | |
|     size_t index;
 | |
| 
 | |
|     if (ctxt->checkIndex == 0)
 | |
|         cur = ctxt->input->cur + 1;
 | |
|     else
 | |
|         cur = ctxt->input->cur + ctxt->checkIndex;
 | |
| 
 | |
|     while (cur < end) {
 | |
|         if (state) {
 | |
|             if (*cur == state)
 | |
|                 state = 0;
 | |
|         } else if (*cur == '\'' || *cur == '"') {
 | |
|             state = *cur;
 | |
|         } else if (*cur == '>') {
 | |
|             ctxt->checkIndex = 0;
 | |
|             ctxt->endCheckState = 0;
 | |
|             return(1);
 | |
|         }
 | |
|         cur++;
 | |
|     }
 | |
| 
 | |
|     index = cur - ctxt->input->cur;
 | |
|     if (index > LONG_MAX) {
 | |
|         ctxt->checkIndex = 0;
 | |
|         ctxt->endCheckState = 0;
 | |
|         return(1);
 | |
|     }
 | |
|     ctxt->checkIndex = index;
 | |
|     ctxt->endCheckState = state;
 | |
|     return(0);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseLookupInternalSubset:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * Check whether there's enough data in the input buffer to finish parsing
 | |
|  * the internal subset.
 | |
|  */
 | |
| static int
 | |
| xmlParseLookupInternalSubset(xmlParserCtxtPtr ctxt) {
 | |
|     /*
 | |
|      * Sorry, but progressive parsing of the internal subset is not
 | |
|      * supported. We first check that the full content of the internal
 | |
|      * subset is available and parsing is launched only at that point.
 | |
|      * Internal subset ends with "']' S? '>'" in an unescaped section and
 | |
|      * not in a ']]>' sequence which are conditional sections.
 | |
|      */
 | |
|     const xmlChar *cur, *start;
 | |
|     const xmlChar *end = ctxt->input->end;
 | |
|     int state = ctxt->endCheckState;
 | |
|     size_t index;
 | |
| 
 | |
|     if (ctxt->checkIndex == 0) {
 | |
|         cur = ctxt->input->cur + 1;
 | |
|     } else {
 | |
|         cur = ctxt->input->cur + ctxt->checkIndex;
 | |
|     }
 | |
|     start = cur;
 | |
| 
 | |
|     while (cur < end) {
 | |
|         if (state == '-') {
 | |
|             if ((*cur == '-') &&
 | |
|                 (cur[1] == '-') &&
 | |
|                 (cur[2] == '>')) {
 | |
|                 state = 0;
 | |
|                 cur += 3;
 | |
|                 start = cur;
 | |
|                 continue;
 | |
|             }
 | |
|         }
 | |
|         else if (state == ']') {
 | |
|             if (*cur == '>') {
 | |
|                 ctxt->checkIndex = 0;
 | |
|                 ctxt->endCheckState = 0;
 | |
|                 return(1);
 | |
|             }
 | |
|             if (IS_BLANK_CH(*cur)) {
 | |
|                 state = ' ';
 | |
|             } else if (*cur != ']') {
 | |
|                 state = 0;
 | |
|                 start = cur;
 | |
|                 continue;
 | |
|             }
 | |
|         }
 | |
|         else if (state == ' ') {
 | |
|             if (*cur == '>') {
 | |
|                 ctxt->checkIndex = 0;
 | |
|                 ctxt->endCheckState = 0;
 | |
|                 return(1);
 | |
|             }
 | |
|             if (!IS_BLANK_CH(*cur)) {
 | |
|                 state = 0;
 | |
|                 start = cur;
 | |
|                 continue;
 | |
|             }
 | |
|         }
 | |
|         else if (state != 0) {
 | |
|             if (*cur == state) {
 | |
|                 state = 0;
 | |
|                 start = cur + 1;
 | |
|             }
 | |
|         }
 | |
|         else if (*cur == '<') {
 | |
|             if ((cur[1] == '!') &&
 | |
|                 (cur[2] == '-') &&
 | |
|                 (cur[3] == '-')) {
 | |
|                 state = '-';
 | |
|                 cur += 4;
 | |
|                 /* Don't treat <!--> as comment */
 | |
|                 start = cur;
 | |
|                 continue;
 | |
|             }
 | |
|         }
 | |
|         else if ((*cur == '"') || (*cur == '\'') || (*cur == ']')) {
 | |
|             state = *cur;
 | |
|         }
 | |
| 
 | |
|         cur++;
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * Rescan the three last characters to detect "<!--" and "-->"
 | |
|      * split across chunks.
 | |
|      */
 | |
|     if ((state == 0) || (state == '-')) {
 | |
|         if (cur - start < 3)
 | |
|             cur = start;
 | |
|         else
 | |
|             cur -= 3;
 | |
|     }
 | |
|     index = cur - ctxt->input->cur;
 | |
|     if (index > LONG_MAX) {
 | |
|         ctxt->checkIndex = 0;
 | |
|         ctxt->endCheckState = 0;
 | |
|         return(1);
 | |
|     }
 | |
|     ctxt->checkIndex = index;
 | |
|     ctxt->endCheckState = state;
 | |
|     return(0);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlCheckCdataPush:
 | |
|  * @cur: pointer to the block of characters
 | |
|  * @len: length of the block in bytes
 | |
|  * @complete: 1 if complete CDATA block is passed in, 0 if partial block
 | |
|  *
 | |
|  * Check that the block of characters is okay as SCdata content [20]
 | |
|  *
 | |
|  * Returns the number of bytes to pass if okay, a negative index where an
 | |
|  *         UTF-8 error occurred otherwise
 | |
|  */
 | |
| static int
 | |
| xmlCheckCdataPush(const xmlChar *utf, int len, int complete) {
 | |
|     int ix;
 | |
|     unsigned char c;
 | |
|     int codepoint;
 | |
| 
 | |
|     if ((utf == NULL) || (len <= 0))
 | |
|         return(0);
 | |
| 
 | |
|     for (ix = 0; ix < len;) {      /* string is 0-terminated */
 | |
|         c = utf[ix];
 | |
|         if ((c & 0x80) == 0x00) {	/* 1-byte code, starts with 10 */
 | |
| 	    if (c >= 0x20)
 | |
| 		ix++;
 | |
| 	    else if ((c == 0xA) || (c == 0xD) || (c == 0x9))
 | |
| 	        ix++;
 | |
| 	    else
 | |
| 	        return(-ix);
 | |
| 	} else if ((c & 0xe0) == 0xc0) {/* 2-byte code, starts with 110 */
 | |
| 	    if (ix + 2 > len) return(complete ? -ix : ix);
 | |
| 	    if ((utf[ix+1] & 0xc0 ) != 0x80)
 | |
| 	        return(-ix);
 | |
| 	    codepoint = (utf[ix] & 0x1f) << 6;
 | |
| 	    codepoint |= utf[ix+1] & 0x3f;
 | |
| 	    if (!xmlIsCharQ(codepoint))
 | |
| 	        return(-ix);
 | |
| 	    ix += 2;
 | |
| 	} else if ((c & 0xf0) == 0xe0) {/* 3-byte code, starts with 1110 */
 | |
| 	    if (ix + 3 > len) return(complete ? -ix : ix);
 | |
| 	    if (((utf[ix+1] & 0xc0) != 0x80) ||
 | |
| 	        ((utf[ix+2] & 0xc0) != 0x80))
 | |
| 		    return(-ix);
 | |
| 	    codepoint = (utf[ix] & 0xf) << 12;
 | |
| 	    codepoint |= (utf[ix+1] & 0x3f) << 6;
 | |
| 	    codepoint |= utf[ix+2] & 0x3f;
 | |
| 	    if (!xmlIsCharQ(codepoint))
 | |
| 	        return(-ix);
 | |
| 	    ix += 3;
 | |
| 	} else if ((c & 0xf8) == 0xf0) {/* 4-byte code, starts with 11110 */
 | |
| 	    if (ix + 4 > len) return(complete ? -ix : ix);
 | |
| 	    if (((utf[ix+1] & 0xc0) != 0x80) ||
 | |
| 	        ((utf[ix+2] & 0xc0) != 0x80) ||
 | |
| 		((utf[ix+3] & 0xc0) != 0x80))
 | |
| 		    return(-ix);
 | |
| 	    codepoint = (utf[ix] & 0x7) << 18;
 | |
| 	    codepoint |= (utf[ix+1] & 0x3f) << 12;
 | |
| 	    codepoint |= (utf[ix+2] & 0x3f) << 6;
 | |
| 	    codepoint |= utf[ix+3] & 0x3f;
 | |
| 	    if (!xmlIsCharQ(codepoint))
 | |
| 	        return(-ix);
 | |
| 	    ix += 4;
 | |
| 	} else				/* unknown encoding */
 | |
| 	    return(-ix);
 | |
|       }
 | |
|       return(ix);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseTryOrFinish:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @terminate:  last chunk indicator
 | |
|  *
 | |
|  * Try to progress on parsing
 | |
|  *
 | |
|  * Returns zero if no parsing was possible
 | |
|  */
 | |
| static int
 | |
| xmlParseTryOrFinish(xmlParserCtxtPtr ctxt, int terminate) {
 | |
|     int ret = 0;
 | |
|     size_t avail;
 | |
|     xmlChar cur, next;
 | |
| 
 | |
|     if (ctxt->input == NULL)
 | |
|         return(0);
 | |
| 
 | |
|     if ((ctxt->input != NULL) &&
 | |
|         (ctxt->input->cur - ctxt->input->base > 4096)) {
 | |
|         xmlParserShrink(ctxt);
 | |
|     }
 | |
| 
 | |
|     while (ctxt->instate != XML_PARSER_EOF) {
 | |
| 	if ((ctxt->errNo != XML_ERR_OK) && (ctxt->disableSAX == 1))
 | |
| 	    return(0);
 | |
| 
 | |
|         avail = ctxt->input->end - ctxt->input->cur;
 | |
|         if (avail < 1)
 | |
| 	    goto done;
 | |
|         switch (ctxt->instate) {
 | |
|             case XML_PARSER_EOF:
 | |
| 	        /*
 | |
| 		 * Document parsing is done !
 | |
| 		 */
 | |
| 	        goto done;
 | |
|             case XML_PARSER_START:
 | |
|                 /*
 | |
|                  * Very first chars read from the document flow.
 | |
|                  */
 | |
|                 if ((!terminate) && (avail < 4))
 | |
|                     goto done;
 | |
| 
 | |
|                 /*
 | |
|                  * We need more bytes to detect EBCDIC code pages.
 | |
|                  * See xmlDetectEBCDIC.
 | |
|                  */
 | |
|                 if ((CMP4(CUR_PTR, 0x4C, 0x6F, 0xA7, 0x94)) &&
 | |
|                     (!terminate) && (avail < 200))
 | |
|                     goto done;
 | |
| 
 | |
|                 xmlDetectEncoding(ctxt);
 | |
|                 if (ctxt->instate == XML_PARSER_EOF)
 | |
|                     goto done;
 | |
|                 ctxt->instate = XML_PARSER_XML_DECL;
 | |
| 		break;
 | |
| 
 | |
|             case XML_PARSER_XML_DECL:
 | |
| 		if ((!terminate) && (avail < 2))
 | |
| 		    goto done;
 | |
| 		cur = ctxt->input->cur[0];
 | |
| 		next = ctxt->input->cur[1];
 | |
| 	        if ((cur == '<') && (next == '?')) {
 | |
| 		    /* PI or XML decl */
 | |
| 		    if ((!terminate) &&
 | |
|                         (!xmlParseLookupString(ctxt, 2, "?>", 2)))
 | |
| 			goto done;
 | |
| 		    if ((ctxt->input->cur[2] == 'x') &&
 | |
| 			(ctxt->input->cur[3] == 'm') &&
 | |
| 			(ctxt->input->cur[4] == 'l') &&
 | |
| 			(IS_BLANK_CH(ctxt->input->cur[5]))) {
 | |
| 			ret += 5;
 | |
| 			xmlParseXMLDecl(ctxt);
 | |
| 			if (ctxt->errNo == XML_ERR_UNSUPPORTED_ENCODING) {
 | |
| 			    /*
 | |
| 			     * The XML REC instructs us to stop parsing right
 | |
| 			     * here
 | |
| 			     */
 | |
| 			    xmlHaltParser(ctxt);
 | |
| 			    return(0);
 | |
| 			}
 | |
| 		    } else {
 | |
| 			ctxt->version = xmlCharStrdup(XML_DEFAULT_VERSION);
 | |
| 		    }
 | |
| 		} else {
 | |
| 		    ctxt->version = xmlCharStrdup(XML_DEFAULT_VERSION);
 | |
| 		    if (ctxt->version == NULL) {
 | |
| 		        xmlErrMemory(ctxt, NULL);
 | |
| 			break;
 | |
| 		    }
 | |
| 		}
 | |
|                 if ((ctxt->sax) && (ctxt->sax->setDocumentLocator))
 | |
|                     ctxt->sax->setDocumentLocator(ctxt->userData,
 | |
|                                                   &xmlDefaultSAXLocator);
 | |
|                 if ((ctxt->sax) && (ctxt->sax->startDocument) &&
 | |
|                     (!ctxt->disableSAX))
 | |
|                     ctxt->sax->startDocument(ctxt->userData);
 | |
|                 if (ctxt->instate == XML_PARSER_EOF)
 | |
|                     goto done;
 | |
|                 ctxt->instate = XML_PARSER_MISC;
 | |
| 		break;
 | |
|             case XML_PARSER_START_TAG: {
 | |
| 	        const xmlChar *name;
 | |
| 		const xmlChar *prefix = NULL;
 | |
| 		const xmlChar *URI = NULL;
 | |
|                 int line = ctxt->input->line;
 | |
| 		int nbNs = 0;
 | |
| 
 | |
| 		if ((!terminate) && (avail < 2))
 | |
| 		    goto done;
 | |
| 		cur = ctxt->input->cur[0];
 | |
| 	        if (cur != '<') {
 | |
| 		    xmlFatalErrMsg(ctxt, XML_ERR_DOCUMENT_EMPTY,
 | |
|                                    "Start tag expected, '<' not found");
 | |
| 		    xmlHaltParser(ctxt);
 | |
| 		    if ((ctxt->sax) && (ctxt->sax->endDocument != NULL))
 | |
| 			ctxt->sax->endDocument(ctxt->userData);
 | |
| 		    goto done;
 | |
| 		}
 | |
| 		if ((!terminate) && (!xmlParseLookupGt(ctxt)))
 | |
|                     goto done;
 | |
| 		if (ctxt->spaceNr == 0)
 | |
| 		    spacePush(ctxt, -1);
 | |
| 		else if (*ctxt->space == -2)
 | |
| 		    spacePush(ctxt, -1);
 | |
| 		else
 | |
| 		    spacePush(ctxt, *ctxt->space);
 | |
| #ifdef LIBXML_SAX1_ENABLED
 | |
| 		if (ctxt->sax2)
 | |
| #endif /* LIBXML_SAX1_ENABLED */
 | |
| 		    name = xmlParseStartTag2(ctxt, &prefix, &URI, &nbNs);
 | |
| #ifdef LIBXML_SAX1_ENABLED
 | |
| 		else
 | |
| 		    name = xmlParseStartTag(ctxt);
 | |
| #endif /* LIBXML_SAX1_ENABLED */
 | |
| 		if (ctxt->instate == XML_PARSER_EOF)
 | |
| 		    goto done;
 | |
| 		if (name == NULL) {
 | |
| 		    spacePop(ctxt);
 | |
| 		    xmlHaltParser(ctxt);
 | |
| 		    if ((ctxt->sax) && (ctxt->sax->endDocument != NULL))
 | |
| 			ctxt->sax->endDocument(ctxt->userData);
 | |
| 		    goto done;
 | |
| 		}
 | |
| #ifdef LIBXML_VALID_ENABLED
 | |
| 		/*
 | |
| 		 * [ VC: Root Element Type ]
 | |
| 		 * The Name in the document type declaration must match
 | |
| 		 * the element type of the root element.
 | |
| 		 */
 | |
| 		if (ctxt->validate && ctxt->wellFormed && ctxt->myDoc &&
 | |
| 		    ctxt->node && (ctxt->node == ctxt->myDoc->children))
 | |
| 		    ctxt->valid &= xmlValidateRoot(&ctxt->vctxt, ctxt->myDoc);
 | |
| #endif /* LIBXML_VALID_ENABLED */
 | |
| 
 | |
| 		/*
 | |
| 		 * Check for an Empty Element.
 | |
| 		 */
 | |
| 		if ((RAW == '/') && (NXT(1) == '>')) {
 | |
| 		    SKIP(2);
 | |
| 
 | |
| 		    if (ctxt->sax2) {
 | |
| 			if ((ctxt->sax != NULL) &&
 | |
| 			    (ctxt->sax->endElementNs != NULL) &&
 | |
| 			    (!ctxt->disableSAX))
 | |
| 			    ctxt->sax->endElementNs(ctxt->userData, name,
 | |
| 			                            prefix, URI);
 | |
| 			if (nbNs > 0)
 | |
| 			    xmlParserNsPop(ctxt, nbNs);
 | |
| #ifdef LIBXML_SAX1_ENABLED
 | |
| 		    } else {
 | |
| 			if ((ctxt->sax != NULL) &&
 | |
| 			    (ctxt->sax->endElement != NULL) &&
 | |
| 			    (!ctxt->disableSAX))
 | |
| 			    ctxt->sax->endElement(ctxt->userData, name);
 | |
| #endif /* LIBXML_SAX1_ENABLED */
 | |
| 		    }
 | |
| 		    spacePop(ctxt);
 | |
| 		} else if (RAW == '>') {
 | |
| 		    NEXT;
 | |
|                     nameNsPush(ctxt, name, prefix, URI, line, nbNs);
 | |
| 		} else {
 | |
| 		    xmlFatalErrMsgStr(ctxt, XML_ERR_GT_REQUIRED,
 | |
| 					 "Couldn't find end of Start Tag %s\n",
 | |
| 					 name);
 | |
| 		    nodePop(ctxt);
 | |
| 		    spacePop(ctxt);
 | |
|                     if (nbNs > 0)
 | |
|                         xmlParserNsPop(ctxt, nbNs);
 | |
| 		}
 | |
| 
 | |
|                 if (ctxt->instate == XML_PARSER_EOF)
 | |
|                     goto done;
 | |
|                 if (ctxt->nameNr == 0)
 | |
|                     ctxt->instate = XML_PARSER_EPILOG;
 | |
|                 else
 | |
|                     ctxt->instate = XML_PARSER_CONTENT;
 | |
|                 break;
 | |
| 	    }
 | |
|             case XML_PARSER_CONTENT: {
 | |
| 		cur = ctxt->input->cur[0];
 | |
| 
 | |
| 		if (cur == '<') {
 | |
|                     if ((!terminate) && (avail < 2))
 | |
|                         goto done;
 | |
| 		    next = ctxt->input->cur[1];
 | |
| 
 | |
|                     if (next == '/') {
 | |
|                         ctxt->instate = XML_PARSER_END_TAG;
 | |
|                         break;
 | |
|                     } else if (next == '?') {
 | |
|                         if ((!terminate) &&
 | |
|                             (!xmlParseLookupString(ctxt, 2, "?>", 2)))
 | |
|                             goto done;
 | |
|                         xmlParsePI(ctxt);
 | |
|                         if (ctxt->instate == XML_PARSER_EOF)
 | |
|                             goto done;
 | |
|                         ctxt->instate = XML_PARSER_CONTENT;
 | |
|                         break;
 | |
|                     } else if (next == '!') {
 | |
|                         if ((!terminate) && (avail < 3))
 | |
|                             goto done;
 | |
|                         next = ctxt->input->cur[2];
 | |
| 
 | |
|                         if (next == '-') {
 | |
|                             if ((!terminate) && (avail < 4))
 | |
|                                 goto done;
 | |
|                             if (ctxt->input->cur[3] == '-') {
 | |
|                                 if ((!terminate) &&
 | |
|                                     (!xmlParseLookupString(ctxt, 4, "-->", 3)))
 | |
|                                     goto done;
 | |
|                                 xmlParseComment(ctxt);
 | |
|                                 if (ctxt->instate == XML_PARSER_EOF)
 | |
|                                     goto done;
 | |
|                                 ctxt->instate = XML_PARSER_CONTENT;
 | |
|                                 break;
 | |
|                             }
 | |
|                         } else if (next == '[') {
 | |
|                             if ((!terminate) && (avail < 9))
 | |
|                                 goto done;
 | |
|                             if ((ctxt->input->cur[2] == '[') &&
 | |
|                                 (ctxt->input->cur[3] == 'C') &&
 | |
|                                 (ctxt->input->cur[4] == 'D') &&
 | |
|                                 (ctxt->input->cur[5] == 'A') &&
 | |
|                                 (ctxt->input->cur[6] == 'T') &&
 | |
|                                 (ctxt->input->cur[7] == 'A') &&
 | |
|                                 (ctxt->input->cur[8] == '[')) {
 | |
|                                 SKIP(9);
 | |
|                                 ctxt->instate = XML_PARSER_CDATA_SECTION;
 | |
|                                 break;
 | |
|                             }
 | |
|                         }
 | |
|                     }
 | |
| 		} else if (cur == '&') {
 | |
| 		    if ((!terminate) && (!xmlParseLookupChar(ctxt, ';')))
 | |
| 			goto done;
 | |
| 		    xmlParseReference(ctxt);
 | |
|                     break;
 | |
| 		} else {
 | |
| 		    /* TODO Avoid the extra copy, handle directly !!! */
 | |
| 		    /*
 | |
| 		     * Goal of the following test is:
 | |
| 		     *  - minimize calls to the SAX 'character' callback
 | |
| 		     *    when they are mergeable
 | |
| 		     *  - handle an problem for isBlank when we only parse
 | |
| 		     *    a sequence of blank chars and the next one is
 | |
| 		     *    not available to check against '<' presence.
 | |
| 		     *  - tries to homogenize the differences in SAX
 | |
| 		     *    callbacks between the push and pull versions
 | |
| 		     *    of the parser.
 | |
| 		     */
 | |
| 		    if (avail < XML_PARSER_BIG_BUFFER_SIZE) {
 | |
| 			if ((!terminate) && (!xmlParseLookupCharData(ctxt)))
 | |
| 			    goto done;
 | |
|                     }
 | |
|                     ctxt->checkIndex = 0;
 | |
| 		    xmlParseCharDataInternal(ctxt, !terminate);
 | |
|                     break;
 | |
| 		}
 | |
| 
 | |
|                 ctxt->instate = XML_PARSER_START_TAG;
 | |
| 		break;
 | |
| 	    }
 | |
|             case XML_PARSER_END_TAG:
 | |
| 		if ((!terminate) && (!xmlParseLookupChar(ctxt, '>')))
 | |
| 		    goto done;
 | |
| 		if (ctxt->sax2) {
 | |
| 	            xmlParseEndTag2(ctxt, &ctxt->pushTab[ctxt->nameNr - 1]);
 | |
| 		    nameNsPop(ctxt);
 | |
| 		}
 | |
| #ifdef LIBXML_SAX1_ENABLED
 | |
| 		  else
 | |
| 		    xmlParseEndTag1(ctxt, 0);
 | |
| #endif /* LIBXML_SAX1_ENABLED */
 | |
|                 if (ctxt->instate == XML_PARSER_EOF)
 | |
|                     goto done;
 | |
| 		if (ctxt->nameNr == 0) {
 | |
| 		    ctxt->instate = XML_PARSER_EPILOG;
 | |
| 		} else {
 | |
| 		    ctxt->instate = XML_PARSER_CONTENT;
 | |
| 		}
 | |
| 		break;
 | |
|             case XML_PARSER_CDATA_SECTION: {
 | |
| 	        /*
 | |
| 		 * The Push mode need to have the SAX callback for
 | |
| 		 * cdataBlock merge back contiguous callbacks.
 | |
| 		 */
 | |
| 		const xmlChar *term;
 | |
| 
 | |
|                 if (terminate) {
 | |
|                     /*
 | |
|                      * Don't call xmlParseLookupString. If 'terminate'
 | |
|                      * is set, checkIndex is invalid.
 | |
|                      */
 | |
|                     term = BAD_CAST strstr((const char *) ctxt->input->cur,
 | |
|                                            "]]>");
 | |
|                 } else {
 | |
| 		    term = xmlParseLookupString(ctxt, 0, "]]>", 3);
 | |
|                 }
 | |
| 
 | |
| 		if (term == NULL) {
 | |
| 		    int tmp, size;
 | |
| 
 | |
|                     if (terminate) {
 | |
|                         /* Unfinished CDATA section */
 | |
|                         size = ctxt->input->end - ctxt->input->cur;
 | |
|                     } else {
 | |
|                         if (avail < XML_PARSER_BIG_BUFFER_SIZE + 2)
 | |
|                             goto done;
 | |
|                         ctxt->checkIndex = 0;
 | |
|                         /* XXX: Why don't we pass the full buffer? */
 | |
|                         size = XML_PARSER_BIG_BUFFER_SIZE;
 | |
|                     }
 | |
|                     tmp = xmlCheckCdataPush(ctxt->input->cur, size, 0);
 | |
|                     if (tmp <= 0) {
 | |
|                         tmp = -tmp;
 | |
|                         ctxt->input->cur += tmp;
 | |
|                         goto encoding_error;
 | |
|                     }
 | |
|                     if ((ctxt->sax != NULL) && (!ctxt->disableSAX)) {
 | |
|                         if (ctxt->sax->cdataBlock != NULL)
 | |
|                             ctxt->sax->cdataBlock(ctxt->userData,
 | |
|                                                   ctxt->input->cur, tmp);
 | |
|                         else if (ctxt->sax->characters != NULL)
 | |
|                             ctxt->sax->characters(ctxt->userData,
 | |
|                                                   ctxt->input->cur, tmp);
 | |
|                     }
 | |
|                     if (ctxt->instate == XML_PARSER_EOF)
 | |
|                         goto done;
 | |
|                     SKIPL(tmp);
 | |
| 		} else {
 | |
|                     int base = term - CUR_PTR;
 | |
| 		    int tmp;
 | |
| 
 | |
| 		    tmp = xmlCheckCdataPush(ctxt->input->cur, base, 1);
 | |
| 		    if ((tmp < 0) || (tmp != base)) {
 | |
| 			tmp = -tmp;
 | |
| 			ctxt->input->cur += tmp;
 | |
| 			goto encoding_error;
 | |
| 		    }
 | |
| 		    if ((ctxt->sax != NULL) && (base == 0) &&
 | |
| 		        (ctxt->sax->cdataBlock != NULL) &&
 | |
| 		        (!ctxt->disableSAX)) {
 | |
| 			/*
 | |
| 			 * Special case to provide identical behaviour
 | |
| 			 * between pull and push parsers on enpty CDATA
 | |
| 			 * sections
 | |
| 			 */
 | |
| 			 if ((ctxt->input->cur - ctxt->input->base >= 9) &&
 | |
| 			     (!strncmp((const char *)&ctxt->input->cur[-9],
 | |
| 			               "<![CDATA[", 9)))
 | |
| 			     ctxt->sax->cdataBlock(ctxt->userData,
 | |
| 			                           BAD_CAST "", 0);
 | |
| 		    } else if ((ctxt->sax != NULL) && (base > 0) &&
 | |
| 			(!ctxt->disableSAX)) {
 | |
| 			if (ctxt->sax->cdataBlock != NULL)
 | |
| 			    ctxt->sax->cdataBlock(ctxt->userData,
 | |
| 						  ctxt->input->cur, base);
 | |
| 			else if (ctxt->sax->characters != NULL)
 | |
| 			    ctxt->sax->characters(ctxt->userData,
 | |
| 						  ctxt->input->cur, base);
 | |
| 		    }
 | |
| 		    if (ctxt->instate == XML_PARSER_EOF)
 | |
| 			goto done;
 | |
| 		    SKIPL(base + 3);
 | |
| 		    ctxt->instate = XML_PARSER_CONTENT;
 | |
| 		}
 | |
| 		break;
 | |
| 	    }
 | |
|             case XML_PARSER_MISC:
 | |
|             case XML_PARSER_PROLOG:
 | |
|             case XML_PARSER_EPILOG:
 | |
| 		SKIP_BLANKS;
 | |
|                 avail = ctxt->input->end - ctxt->input->cur;
 | |
| 		if (avail < 1)
 | |
| 		    goto done;
 | |
| 		if (ctxt->input->cur[0] == '<') {
 | |
|                     if ((!terminate) && (avail < 2))
 | |
|                         goto done;
 | |
|                     next = ctxt->input->cur[1];
 | |
|                     if (next == '?') {
 | |
|                         if ((!terminate) &&
 | |
|                             (!xmlParseLookupString(ctxt, 2, "?>", 2)))
 | |
|                             goto done;
 | |
|                         xmlParsePI(ctxt);
 | |
|                         if (ctxt->instate == XML_PARSER_EOF)
 | |
|                             goto done;
 | |
|                         break;
 | |
|                     } else if (next == '!') {
 | |
|                         if ((!terminate) && (avail < 3))
 | |
|                             goto done;
 | |
| 
 | |
|                         if (ctxt->input->cur[2] == '-') {
 | |
|                             if ((!terminate) && (avail < 4))
 | |
|                                 goto done;
 | |
|                             if (ctxt->input->cur[3] == '-') {
 | |
|                                 if ((!terminate) &&
 | |
|                                     (!xmlParseLookupString(ctxt, 4, "-->", 3)))
 | |
|                                     goto done;
 | |
|                                 xmlParseComment(ctxt);
 | |
|                                 if (ctxt->instate == XML_PARSER_EOF)
 | |
|                                     goto done;
 | |
|                                 break;
 | |
|                             }
 | |
|                         } else if (ctxt->instate == XML_PARSER_MISC) {
 | |
|                             if ((!terminate) && (avail < 9))
 | |
|                                 goto done;
 | |
|                             if ((ctxt->input->cur[2] == 'D') &&
 | |
|                                 (ctxt->input->cur[3] == 'O') &&
 | |
|                                 (ctxt->input->cur[4] == 'C') &&
 | |
|                                 (ctxt->input->cur[5] == 'T') &&
 | |
|                                 (ctxt->input->cur[6] == 'Y') &&
 | |
|                                 (ctxt->input->cur[7] == 'P') &&
 | |
|                                 (ctxt->input->cur[8] == 'E')) {
 | |
|                                 if ((!terminate) && (!xmlParseLookupGt(ctxt)))
 | |
|                                     goto done;
 | |
|                                 ctxt->inSubset = 1;
 | |
|                                 xmlParseDocTypeDecl(ctxt);
 | |
|                                 if (ctxt->instate == XML_PARSER_EOF)
 | |
|                                     goto done;
 | |
|                                 if (RAW == '[') {
 | |
|                                     ctxt->instate = XML_PARSER_DTD;
 | |
|                                 } else {
 | |
|                                     /*
 | |
|                                      * Create and update the external subset.
 | |
|                                      */
 | |
|                                     ctxt->inSubset = 2;
 | |
|                                     if ((ctxt->sax != NULL) &&
 | |
|                                         (!ctxt->disableSAX) &&
 | |
|                                         (ctxt->sax->externalSubset != NULL))
 | |
|                                         ctxt->sax->externalSubset(
 | |
|                                                 ctxt->userData,
 | |
|                                                 ctxt->intSubName,
 | |
|                                                 ctxt->extSubSystem,
 | |
|                                                 ctxt->extSubURI);
 | |
|                                     ctxt->inSubset = 0;
 | |
|                                     xmlCleanSpecialAttr(ctxt);
 | |
|                                     if (ctxt->instate == XML_PARSER_EOF)
 | |
|                                         goto done;
 | |
|                                     ctxt->instate = XML_PARSER_PROLOG;
 | |
|                                 }
 | |
|                                 break;
 | |
|                             }
 | |
|                         }
 | |
|                     }
 | |
|                 }
 | |
| 
 | |
|                 if (ctxt->instate == XML_PARSER_EPILOG) {
 | |
|                     if (ctxt->errNo == XML_ERR_OK)
 | |
|                         xmlFatalErr(ctxt, XML_ERR_DOCUMENT_END, NULL);
 | |
| 		    ctxt->instate = XML_PARSER_EOF;
 | |
|                     if ((ctxt->sax) && (ctxt->sax->endDocument != NULL))
 | |
|                         ctxt->sax->endDocument(ctxt->userData);
 | |
|                 } else {
 | |
| 		    ctxt->instate = XML_PARSER_START_TAG;
 | |
| 		}
 | |
| 		break;
 | |
|             case XML_PARSER_DTD: {
 | |
|                 if ((!terminate) && (!xmlParseLookupInternalSubset(ctxt)))
 | |
|                     goto done;
 | |
| 		xmlParseInternalSubset(ctxt);
 | |
| 		if (ctxt->instate == XML_PARSER_EOF)
 | |
| 		    goto done;
 | |
| 		ctxt->inSubset = 2;
 | |
| 		if ((ctxt->sax != NULL) && (!ctxt->disableSAX) &&
 | |
| 		    (ctxt->sax->externalSubset != NULL))
 | |
| 		    ctxt->sax->externalSubset(ctxt->userData, ctxt->intSubName,
 | |
| 			    ctxt->extSubSystem, ctxt->extSubURI);
 | |
| 		ctxt->inSubset = 0;
 | |
| 		xmlCleanSpecialAttr(ctxt);
 | |
| 		if (ctxt->instate == XML_PARSER_EOF)
 | |
| 		    goto done;
 | |
| 		ctxt->instate = XML_PARSER_PROLOG;
 | |
|                 break;
 | |
| 	    }
 | |
|             default:
 | |
| 		xmlGenericError(xmlGenericErrorContext,
 | |
| 			"PP: internal error\n");
 | |
| 		ctxt->instate = XML_PARSER_EOF;
 | |
| 		break;
 | |
| 	}
 | |
|     }
 | |
| done:
 | |
|     return(ret);
 | |
| encoding_error:
 | |
|     if (ctxt->input->end - ctxt->input->cur < 4) {
 | |
| 	__xmlErrEncoding(ctxt, XML_ERR_INVALID_CHAR,
 | |
| 		     "Input is not proper UTF-8, indicate encoding !\n",
 | |
| 		     NULL, NULL);
 | |
|     } else {
 | |
|         char buffer[150];
 | |
| 
 | |
| 	snprintf(buffer, 149, "Bytes: 0x%02X 0x%02X 0x%02X 0x%02X\n",
 | |
| 			ctxt->input->cur[0], ctxt->input->cur[1],
 | |
| 			ctxt->input->cur[2], ctxt->input->cur[3]);
 | |
| 	__xmlErrEncoding(ctxt, XML_ERR_INVALID_CHAR,
 | |
| 		     "Input is not proper UTF-8, indicate encoding !\n%s",
 | |
| 		     BAD_CAST buffer, NULL);
 | |
|     }
 | |
|     return(0);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseChunk:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @chunk:  an char array
 | |
|  * @size:  the size in byte of the chunk
 | |
|  * @terminate:  last chunk indicator
 | |
|  *
 | |
|  * Parse a Chunk of memory
 | |
|  *
 | |
|  * Returns zero if no error, the xmlParserErrors otherwise.
 | |
|  */
 | |
| int
 | |
| xmlParseChunk(xmlParserCtxtPtr ctxt, const char *chunk, int size,
 | |
|               int terminate) {
 | |
|     int end_in_lf = 0;
 | |
| 
 | |
|     if (ctxt == NULL)
 | |
|         return(XML_ERR_INTERNAL_ERROR);
 | |
|     if ((ctxt->errNo != XML_ERR_OK) && (ctxt->disableSAX == 1))
 | |
|         return(ctxt->errNo);
 | |
|     if (ctxt->instate == XML_PARSER_EOF)
 | |
|         return(-1);
 | |
|     if (ctxt->input == NULL)
 | |
|         return(-1);
 | |
| 
 | |
|     ctxt->progressive = 1;
 | |
|     if (ctxt->instate == XML_PARSER_START)
 | |
|         xmlDetectSAX2(ctxt);
 | |
|     if ((size > 0) && (chunk != NULL) && (!terminate) &&
 | |
|         (chunk[size - 1] == '\r')) {
 | |
| 	end_in_lf = 1;
 | |
| 	size--;
 | |
|     }
 | |
| 
 | |
|     if ((size > 0) && (chunk != NULL) && (ctxt->input != NULL) &&
 | |
|         (ctxt->input->buf != NULL) && (ctxt->instate != XML_PARSER_EOF))  {
 | |
| 	size_t pos = ctxt->input->cur - ctxt->input->base;
 | |
| 	int res;
 | |
| 
 | |
| 	res = xmlParserInputBufferPush(ctxt->input->buf, size, chunk);
 | |
|         xmlBufUpdateInput(ctxt->input->buf->buffer, ctxt->input, pos);
 | |
| 	if (res < 0) {
 | |
|             xmlFatalErr(ctxt, ctxt->input->buf->error, NULL);
 | |
| 	    xmlHaltParser(ctxt);
 | |
| 	    return(ctxt->errNo);
 | |
| 	}
 | |
|     }
 | |
| 
 | |
|     xmlParseTryOrFinish(ctxt, terminate);
 | |
|     if (ctxt->instate == XML_PARSER_EOF)
 | |
|         return(ctxt->errNo);
 | |
| 
 | |
|     if ((ctxt->input != NULL) &&
 | |
|          (((ctxt->input->end - ctxt->input->cur) > XML_MAX_LOOKUP_LIMIT) ||
 | |
|          ((ctxt->input->cur - ctxt->input->base) > XML_MAX_LOOKUP_LIMIT)) &&
 | |
|         ((ctxt->options & XML_PARSE_HUGE) == 0)) {
 | |
|         xmlFatalErr(ctxt, XML_ERR_INTERNAL_ERROR, "Huge input lookup");
 | |
|         xmlHaltParser(ctxt);
 | |
|     }
 | |
|     if ((ctxt->errNo != XML_ERR_OK) && (ctxt->disableSAX == 1))
 | |
|         return(ctxt->errNo);
 | |
| 
 | |
|     if ((end_in_lf == 1) && (ctxt->input != NULL) &&
 | |
|         (ctxt->input->buf != NULL)) {
 | |
| 	size_t pos = ctxt->input->cur - ctxt->input->base;
 | |
|         int res;
 | |
| 
 | |
| 	res = xmlParserInputBufferPush(ctxt->input->buf, 1, "\r");
 | |
| 	xmlBufUpdateInput(ctxt->input->buf->buffer, ctxt->input, pos);
 | |
|         if (res < 0) {
 | |
|             xmlFatalErr(ctxt, ctxt->input->buf->error, NULL);
 | |
|             xmlHaltParser(ctxt);
 | |
|             return(ctxt->errNo);
 | |
|         }
 | |
|     }
 | |
|     if (terminate) {
 | |
| 	/*
 | |
| 	 * Check for termination
 | |
| 	 */
 | |
|         if ((ctxt->instate != XML_PARSER_EOF) &&
 | |
|             (ctxt->instate != XML_PARSER_EPILOG)) {
 | |
|             if (ctxt->nameNr > 0) {
 | |
|                 const xmlChar *name = ctxt->nameTab[ctxt->nameNr - 1];
 | |
|                 int line = ctxt->pushTab[ctxt->nameNr - 1].line;
 | |
|                 xmlFatalErrMsgStrIntStr(ctxt, XML_ERR_TAG_NOT_FINISHED,
 | |
|                         "Premature end of data in tag %s line %d\n",
 | |
|                         name, line, NULL);
 | |
|             } else if (ctxt->instate == XML_PARSER_START) {
 | |
|                 xmlFatalErr(ctxt, XML_ERR_DOCUMENT_EMPTY, NULL);
 | |
|             } else {
 | |
|                 xmlFatalErrMsg(ctxt, XML_ERR_DOCUMENT_EMPTY,
 | |
|                                "Start tag expected, '<' not found\n");
 | |
|             }
 | |
|         } else if ((ctxt->input->buf != NULL) &&
 | |
|                    (ctxt->input->buf->encoder != NULL) &&
 | |
|                    (!xmlBufIsEmpty(ctxt->input->buf->raw))) {
 | |
|             xmlFatalErrMsg(ctxt, XML_ERR_INVALID_CHAR,
 | |
|                            "Truncated multi-byte sequence at EOF\n");
 | |
|         }
 | |
| 	if (ctxt->instate != XML_PARSER_EOF) {
 | |
| 	    if ((ctxt->sax) && (ctxt->sax->endDocument != NULL))
 | |
| 		ctxt->sax->endDocument(ctxt->userData);
 | |
| 	}
 | |
| 	ctxt->instate = XML_PARSER_EOF;
 | |
|     }
 | |
|     if (ctxt->wellFormed == 0)
 | |
| 	return((xmlParserErrors) ctxt->errNo);
 | |
|     else
 | |
|         return(0);
 | |
| }
 | |
| 
 | |
| /************************************************************************
 | |
|  *									*
 | |
|  *		I/O front end functions to the parser			*
 | |
|  *									*
 | |
|  ************************************************************************/
 | |
| 
 | |
| /**
 | |
|  * xmlCreatePushParserCtxt:
 | |
|  * @sax:  a SAX handler
 | |
|  * @user_data:  The user data returned on SAX callbacks
 | |
|  * @chunk:  a pointer to an array of chars
 | |
|  * @size:  number of chars in the array
 | |
|  * @filename:  an optional file name or URI
 | |
|  *
 | |
|  * Create a parser context for using the XML parser in push mode.
 | |
|  * If @buffer and @size are non-NULL, the data is used to detect
 | |
|  * the encoding.  The remaining characters will be parsed so they
 | |
|  * don't need to be fed in again through xmlParseChunk.
 | |
|  * To allow content encoding detection, @size should be >= 4
 | |
|  * The value of @filename is used for fetching external entities
 | |
|  * and error/warning reports.
 | |
|  *
 | |
|  * Returns the new parser context or NULL
 | |
|  */
 | |
| 
 | |
| xmlParserCtxtPtr
 | |
| xmlCreatePushParserCtxt(xmlSAXHandlerPtr sax, void *user_data,
 | |
|                         const char *chunk, int size, const char *filename) {
 | |
|     xmlParserCtxtPtr ctxt;
 | |
|     xmlParserInputPtr inputStream;
 | |
|     xmlParserInputBufferPtr buf;
 | |
| 
 | |
|     buf = xmlAllocParserInputBuffer(XML_CHAR_ENCODING_NONE);
 | |
|     if (buf == NULL) return(NULL);
 | |
| 
 | |
|     ctxt = xmlNewSAXParserCtxt(sax, user_data);
 | |
|     if (ctxt == NULL) {
 | |
|         xmlErrMemory(NULL, "creating parser: out of memory\n");
 | |
| 	xmlFreeParserInputBuffer(buf);
 | |
| 	return(NULL);
 | |
|     }
 | |
|     ctxt->dictNames = 1;
 | |
|     if (filename == NULL) {
 | |
| 	ctxt->directory = NULL;
 | |
|     } else {
 | |
|         ctxt->directory = xmlParserGetDirectory(filename);
 | |
|     }
 | |
| 
 | |
|     inputStream = xmlNewInputStream(ctxt);
 | |
|     if (inputStream == NULL) {
 | |
| 	xmlFreeParserCtxt(ctxt);
 | |
| 	xmlFreeParserInputBuffer(buf);
 | |
| 	return(NULL);
 | |
|     }
 | |
| 
 | |
|     if (filename == NULL)
 | |
| 	inputStream->filename = NULL;
 | |
|     else {
 | |
| 	inputStream->filename = (char *)
 | |
| 	    xmlCanonicPath((const xmlChar *) filename);
 | |
| 	if (inputStream->filename == NULL) {
 | |
|             xmlFreeInputStream(inputStream);
 | |
| 	    xmlFreeParserCtxt(ctxt);
 | |
| 	    xmlFreeParserInputBuffer(buf);
 | |
| 	    return(NULL);
 | |
| 	}
 | |
|     }
 | |
|     inputStream->buf = buf;
 | |
|     xmlBufResetInput(inputStream->buf->buffer, inputStream);
 | |
|     inputPush(ctxt, inputStream);
 | |
| 
 | |
|     if ((size != 0) && (chunk != NULL) &&
 | |
|         (ctxt->input != NULL) && (ctxt->input->buf != NULL)) {
 | |
| 	size_t pos = ctxt->input->cur - ctxt->input->base;
 | |
|         int res;
 | |
| 
 | |
| 	res = xmlParserInputBufferPush(ctxt->input->buf, size, chunk);
 | |
|         xmlBufUpdateInput(ctxt->input->buf->buffer, ctxt->input, pos);
 | |
|         if (res < 0) {
 | |
|             xmlFatalErr(ctxt, ctxt->input->buf->error, NULL);
 | |
|             xmlHaltParser(ctxt);
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     return(ctxt);
 | |
| }
 | |
| #endif /* LIBXML_PUSH_ENABLED */
 | |
| 
 | |
| /**
 | |
|  * xmlStopParser:
 | |
|  * @ctxt:  an XML parser context
 | |
|  *
 | |
|  * Blocks further parser processing
 | |
|  */
 | |
| void
 | |
| xmlStopParser(xmlParserCtxtPtr ctxt) {
 | |
|     if (ctxt == NULL)
 | |
|         return;
 | |
|     xmlHaltParser(ctxt);
 | |
|     ctxt->errNo = XML_ERR_USER_STOP;
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlCreateIOParserCtxt:
 | |
|  * @sax:  a SAX handler
 | |
|  * @user_data:  The user data returned on SAX callbacks
 | |
|  * @ioread:  an I/O read function
 | |
|  * @ioclose:  an I/O close function
 | |
|  * @ioctx:  an I/O handler
 | |
|  * @enc:  the charset encoding if known
 | |
|  *
 | |
|  * Create a parser context for using the XML parser with an existing
 | |
|  * I/O stream
 | |
|  *
 | |
|  * Returns the new parser context or NULL
 | |
|  */
 | |
| xmlParserCtxtPtr
 | |
| xmlCreateIOParserCtxt(xmlSAXHandlerPtr sax, void *user_data,
 | |
| 	xmlInputReadCallback   ioread, xmlInputCloseCallback  ioclose,
 | |
| 	void *ioctx, xmlCharEncoding enc) {
 | |
|     xmlParserCtxtPtr ctxt;
 | |
|     xmlParserInputPtr inputStream;
 | |
|     xmlParserInputBufferPtr buf;
 | |
| 
 | |
|     if (ioread == NULL) return(NULL);
 | |
| 
 | |
|     buf = xmlParserInputBufferCreateIO(ioread, ioclose, ioctx, enc);
 | |
|     if (buf == NULL) {
 | |
|         if (ioclose != NULL)
 | |
|             ioclose(ioctx);
 | |
|         return (NULL);
 | |
|     }
 | |
| 
 | |
|     ctxt = xmlNewSAXParserCtxt(sax, user_data);
 | |
|     if (ctxt == NULL) {
 | |
| 	xmlFreeParserInputBuffer(buf);
 | |
| 	return(NULL);
 | |
|     }
 | |
| 
 | |
|     inputStream = xmlNewIOInputStream(ctxt, buf, enc);
 | |
|     if (inputStream == NULL) {
 | |
| 	xmlFreeParserCtxt(ctxt);
 | |
| 	return(NULL);
 | |
|     }
 | |
|     inputPush(ctxt, inputStream);
 | |
| 
 | |
|     return(ctxt);
 | |
| }
 | |
| 
 | |
| #ifdef LIBXML_VALID_ENABLED
 | |
| /************************************************************************
 | |
|  *									*
 | |
|  *		Front ends when parsing a DTD				*
 | |
|  *									*
 | |
|  ************************************************************************/
 | |
| 
 | |
| /**
 | |
|  * xmlIOParseDTD:
 | |
|  * @sax:  the SAX handler block or NULL
 | |
|  * @input:  an Input Buffer
 | |
|  * @enc:  the charset encoding if known
 | |
|  *
 | |
|  * Load and parse a DTD
 | |
|  *
 | |
|  * Returns the resulting xmlDtdPtr or NULL in case of error.
 | |
|  * @input will be freed by the function in any case.
 | |
|  */
 | |
| 
 | |
| xmlDtdPtr
 | |
| xmlIOParseDTD(xmlSAXHandlerPtr sax, xmlParserInputBufferPtr input,
 | |
| 	      xmlCharEncoding enc) {
 | |
|     xmlDtdPtr ret = NULL;
 | |
|     xmlParserCtxtPtr ctxt;
 | |
|     xmlParserInputPtr pinput = NULL;
 | |
| 
 | |
|     if (input == NULL)
 | |
| 	return(NULL);
 | |
| 
 | |
|     ctxt = xmlNewSAXParserCtxt(sax, NULL);
 | |
|     if (ctxt == NULL) {
 | |
|         xmlFreeParserInputBuffer(input);
 | |
| 	return(NULL);
 | |
|     }
 | |
| 
 | |
|     /* We are loading a DTD */
 | |
|     ctxt->options |= XML_PARSE_DTDLOAD;
 | |
| 
 | |
|     xmlDetectSAX2(ctxt);
 | |
| 
 | |
|     /*
 | |
|      * generate a parser input from the I/O handler
 | |
|      */
 | |
| 
 | |
|     pinput = xmlNewIOInputStream(ctxt, input, XML_CHAR_ENCODING_NONE);
 | |
|     if (pinput == NULL) {
 | |
|         xmlFreeParserInputBuffer(input);
 | |
| 	xmlFreeParserCtxt(ctxt);
 | |
| 	return(NULL);
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * plug some encoding conversion routines here.
 | |
|      */
 | |
|     if (xmlPushInput(ctxt, pinput) < 0) {
 | |
| 	xmlFreeParserCtxt(ctxt);
 | |
| 	return(NULL);
 | |
|     }
 | |
|     if (enc != XML_CHAR_ENCODING_NONE) {
 | |
|         xmlSwitchEncoding(ctxt, enc);
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * let's parse that entity knowing it's an external subset.
 | |
|      */
 | |
|     ctxt->inSubset = 2;
 | |
|     ctxt->myDoc = xmlNewDoc(BAD_CAST "1.0");
 | |
|     if (ctxt->myDoc == NULL) {
 | |
| 	xmlErrMemory(ctxt, "New Doc failed");
 | |
| 	return(NULL);
 | |
|     }
 | |
|     ctxt->myDoc->properties = XML_DOC_INTERNAL;
 | |
|     ctxt->myDoc->extSubset = xmlNewDtd(ctxt->myDoc, BAD_CAST "none",
 | |
| 	                               BAD_CAST "none", BAD_CAST "none");
 | |
| 
 | |
|     xmlDetectEncoding(ctxt);
 | |
| 
 | |
|     xmlParseExternalSubset(ctxt, BAD_CAST "none", BAD_CAST "none");
 | |
| 
 | |
|     if (ctxt->myDoc != NULL) {
 | |
| 	if (ctxt->wellFormed) {
 | |
| 	    ret = ctxt->myDoc->extSubset;
 | |
| 	    ctxt->myDoc->extSubset = NULL;
 | |
| 	    if (ret != NULL) {
 | |
| 		xmlNodePtr tmp;
 | |
| 
 | |
| 		ret->doc = NULL;
 | |
| 		tmp = ret->children;
 | |
| 		while (tmp != NULL) {
 | |
| 		    tmp->doc = NULL;
 | |
| 		    tmp = tmp->next;
 | |
| 		}
 | |
| 	    }
 | |
| 	} else {
 | |
| 	    ret = NULL;
 | |
| 	}
 | |
|         xmlFreeDoc(ctxt->myDoc);
 | |
|         ctxt->myDoc = NULL;
 | |
|     }
 | |
|     xmlFreeParserCtxt(ctxt);
 | |
| 
 | |
|     return(ret);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlSAXParseDTD:
 | |
|  * @sax:  the SAX handler block
 | |
|  * @ExternalID:  a NAME* containing the External ID of the DTD
 | |
|  * @SystemID:  a NAME* containing the URL to the DTD
 | |
|  *
 | |
|  * DEPRECATED: Don't use.
 | |
|  *
 | |
|  * Load and parse an external subset.
 | |
|  *
 | |
|  * Returns the resulting xmlDtdPtr or NULL in case of error.
 | |
|  */
 | |
| 
 | |
| xmlDtdPtr
 | |
| xmlSAXParseDTD(xmlSAXHandlerPtr sax, const xmlChar *ExternalID,
 | |
|                           const xmlChar *SystemID) {
 | |
|     xmlDtdPtr ret = NULL;
 | |
|     xmlParserCtxtPtr ctxt;
 | |
|     xmlParserInputPtr input = NULL;
 | |
|     xmlChar* systemIdCanonic;
 | |
| 
 | |
|     if ((ExternalID == NULL) && (SystemID == NULL)) return(NULL);
 | |
| 
 | |
|     ctxt = xmlNewSAXParserCtxt(sax, NULL);
 | |
|     if (ctxt == NULL) {
 | |
| 	return(NULL);
 | |
|     }
 | |
| 
 | |
|     /* We are loading a DTD */
 | |
|     ctxt->options |= XML_PARSE_DTDLOAD;
 | |
| 
 | |
|     /*
 | |
|      * Canonicalise the system ID
 | |
|      */
 | |
|     systemIdCanonic = xmlCanonicPath(SystemID);
 | |
|     if ((SystemID != NULL) && (systemIdCanonic == NULL)) {
 | |
| 	xmlFreeParserCtxt(ctxt);
 | |
| 	return(NULL);
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * Ask the Entity resolver to load the damn thing
 | |
|      */
 | |
| 
 | |
|     if ((ctxt->sax != NULL) && (ctxt->sax->resolveEntity != NULL))
 | |
| 	input = ctxt->sax->resolveEntity(ctxt->userData, ExternalID,
 | |
| 	                                 systemIdCanonic);
 | |
|     if (input == NULL) {
 | |
| 	xmlFreeParserCtxt(ctxt);
 | |
| 	if (systemIdCanonic != NULL)
 | |
| 	    xmlFree(systemIdCanonic);
 | |
| 	return(NULL);
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * plug some encoding conversion routines here.
 | |
|      */
 | |
|     if (xmlPushInput(ctxt, input) < 0) {
 | |
| 	xmlFreeParserCtxt(ctxt);
 | |
| 	if (systemIdCanonic != NULL)
 | |
| 	    xmlFree(systemIdCanonic);
 | |
| 	return(NULL);
 | |
|     }
 | |
| 
 | |
|     xmlDetectEncoding(ctxt);
 | |
| 
 | |
|     if (input->filename == NULL)
 | |
| 	input->filename = (char *) systemIdCanonic;
 | |
|     else
 | |
| 	xmlFree(systemIdCanonic);
 | |
| 
 | |
|     /*
 | |
|      * let's parse that entity knowing it's an external subset.
 | |
|      */
 | |
|     ctxt->inSubset = 2;
 | |
|     ctxt->myDoc = xmlNewDoc(BAD_CAST "1.0");
 | |
|     if (ctxt->myDoc == NULL) {
 | |
| 	xmlErrMemory(ctxt, "New Doc failed");
 | |
| 	xmlFreeParserCtxt(ctxt);
 | |
| 	return(NULL);
 | |
|     }
 | |
|     ctxt->myDoc->properties = XML_DOC_INTERNAL;
 | |
|     ctxt->myDoc->extSubset = xmlNewDtd(ctxt->myDoc, BAD_CAST "none",
 | |
| 	                               ExternalID, SystemID);
 | |
|     xmlParseExternalSubset(ctxt, ExternalID, SystemID);
 | |
| 
 | |
|     if (ctxt->myDoc != NULL) {
 | |
| 	if (ctxt->wellFormed) {
 | |
| 	    ret = ctxt->myDoc->extSubset;
 | |
| 	    ctxt->myDoc->extSubset = NULL;
 | |
| 	    if (ret != NULL) {
 | |
| 		xmlNodePtr tmp;
 | |
| 
 | |
| 		ret->doc = NULL;
 | |
| 		tmp = ret->children;
 | |
| 		while (tmp != NULL) {
 | |
| 		    tmp->doc = NULL;
 | |
| 		    tmp = tmp->next;
 | |
| 		}
 | |
| 	    }
 | |
| 	} else {
 | |
| 	    ret = NULL;
 | |
| 	}
 | |
|         xmlFreeDoc(ctxt->myDoc);
 | |
|         ctxt->myDoc = NULL;
 | |
|     }
 | |
|     xmlFreeParserCtxt(ctxt);
 | |
| 
 | |
|     return(ret);
 | |
| }
 | |
| 
 | |
| 
 | |
| /**
 | |
|  * xmlParseDTD:
 | |
|  * @ExternalID:  a NAME* containing the External ID of the DTD
 | |
|  * @SystemID:  a NAME* containing the URL to the DTD
 | |
|  *
 | |
|  * Load and parse an external subset.
 | |
|  *
 | |
|  * Returns the resulting xmlDtdPtr or NULL in case of error.
 | |
|  */
 | |
| 
 | |
| xmlDtdPtr
 | |
| xmlParseDTD(const xmlChar *ExternalID, const xmlChar *SystemID) {
 | |
|     return(xmlSAXParseDTD(NULL, ExternalID, SystemID));
 | |
| }
 | |
| #endif /* LIBXML_VALID_ENABLED */
 | |
| 
 | |
| /************************************************************************
 | |
|  *									*
 | |
|  *		Front ends when parsing an Entity			*
 | |
|  *									*
 | |
|  ************************************************************************/
 | |
| 
 | |
| /**
 | |
|  * xmlParseCtxtExternalEntity:
 | |
|  * @ctx:  the existing parsing context
 | |
|  * @URL:  the URL for the entity to load
 | |
|  * @ID:  the System ID for the entity to load
 | |
|  * @lst:  the return value for the set of parsed nodes
 | |
|  *
 | |
|  * Parse an external general entity within an existing parsing context
 | |
|  * An external general parsed entity is well-formed if it matches the
 | |
|  * production labeled extParsedEnt.
 | |
|  *
 | |
|  * [78] extParsedEnt ::= TextDecl? content
 | |
|  *
 | |
|  * Returns 0 if the entity is well formed, -1 in case of args problem and
 | |
|  *    the parser error code otherwise
 | |
|  */
 | |
| 
 | |
| int
 | |
| xmlParseCtxtExternalEntity(xmlParserCtxtPtr ctx, const xmlChar *URL,
 | |
| 	               const xmlChar *ID, xmlNodePtr *lst) {
 | |
|     void *userData;
 | |
| 
 | |
|     if (ctx == NULL) return(-1);
 | |
|     /*
 | |
|      * If the user provided their own SAX callbacks, then reuse the
 | |
|      * userData callback field, otherwise the expected setup in a
 | |
|      * DOM builder is to have userData == ctxt
 | |
|      */
 | |
|     if (ctx->userData == ctx)
 | |
|         userData = NULL;
 | |
|     else
 | |
|         userData = ctx->userData;
 | |
|     return xmlParseExternalEntityPrivate(ctx->myDoc, ctx, ctx->sax,
 | |
|                                          userData, ctx->depth + 1,
 | |
|                                          URL, ID, lst);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseExternalEntityPrivate:
 | |
|  * @doc:  the document the chunk pertains to
 | |
|  * @oldctxt:  the previous parser context if available
 | |
|  * @sax:  the SAX handler block (possibly NULL)
 | |
|  * @user_data:  The user data returned on SAX callbacks (possibly NULL)
 | |
|  * @depth:  Used for loop detection, use 0
 | |
|  * @URL:  the URL for the entity to load
 | |
|  * @ID:  the System ID for the entity to load
 | |
|  * @list:  the return value for the set of parsed nodes
 | |
|  *
 | |
|  * Private version of xmlParseExternalEntity()
 | |
|  *
 | |
|  * Returns 0 if the entity is well formed, -1 in case of args problem and
 | |
|  *    the parser error code otherwise
 | |
|  */
 | |
| 
 | |
| static xmlParserErrors
 | |
| xmlParseExternalEntityPrivate(xmlDocPtr doc, xmlParserCtxtPtr oldctxt,
 | |
| 	              xmlSAXHandlerPtr sax,
 | |
| 		      void *user_data, int depth, const xmlChar *URL,
 | |
| 		      const xmlChar *ID, xmlNodePtr *list) {
 | |
|     xmlParserCtxtPtr ctxt;
 | |
|     xmlDocPtr newDoc;
 | |
|     xmlNodePtr newRoot;
 | |
|     xmlParserErrors ret = XML_ERR_OK;
 | |
| 
 | |
|     if (((depth > 40) &&
 | |
| 	((oldctxt == NULL) || (oldctxt->options & XML_PARSE_HUGE) == 0)) ||
 | |
| 	(depth > 100)) {
 | |
| 	xmlFatalErrMsg(oldctxt, XML_ERR_ENTITY_LOOP,
 | |
|                        "Maximum entity nesting depth exceeded");
 | |
|         return(XML_ERR_ENTITY_LOOP);
 | |
|     }
 | |
| 
 | |
|     if (list != NULL)
 | |
|         *list = NULL;
 | |
|     if ((URL == NULL) && (ID == NULL))
 | |
| 	return(XML_ERR_INTERNAL_ERROR);
 | |
|     if (doc == NULL)
 | |
| 	return(XML_ERR_INTERNAL_ERROR);
 | |
| 
 | |
|     ctxt = xmlCreateEntityParserCtxtInternal(sax, user_data, URL, ID, NULL,
 | |
|                                              oldctxt);
 | |
|     if (ctxt == NULL) return(XML_WAR_UNDECLARED_ENTITY);
 | |
|     if (oldctxt != NULL) {
 | |
|         ctxt->nbErrors = oldctxt->nbErrors;
 | |
|         ctxt->nbWarnings = oldctxt->nbWarnings;
 | |
|     }
 | |
|     xmlDetectSAX2(ctxt);
 | |
| 
 | |
|     newDoc = xmlNewDoc(BAD_CAST "1.0");
 | |
|     if (newDoc == NULL) {
 | |
| 	xmlFreeParserCtxt(ctxt);
 | |
| 	return(XML_ERR_INTERNAL_ERROR);
 | |
|     }
 | |
|     newDoc->properties = XML_DOC_INTERNAL;
 | |
|     if (doc) {
 | |
|         newDoc->intSubset = doc->intSubset;
 | |
|         newDoc->extSubset = doc->extSubset;
 | |
|         if (doc->dict) {
 | |
|             newDoc->dict = doc->dict;
 | |
|             xmlDictReference(newDoc->dict);
 | |
|         }
 | |
|         if (doc->URL != NULL) {
 | |
|             newDoc->URL = xmlStrdup(doc->URL);
 | |
|         }
 | |
|     }
 | |
|     newRoot = xmlNewDocNode(newDoc, NULL, BAD_CAST "pseudoroot", NULL);
 | |
|     if (newRoot == NULL) {
 | |
| 	if (sax != NULL)
 | |
| 	xmlFreeParserCtxt(ctxt);
 | |
| 	newDoc->intSubset = NULL;
 | |
| 	newDoc->extSubset = NULL;
 | |
|         xmlFreeDoc(newDoc);
 | |
| 	return(XML_ERR_INTERNAL_ERROR);
 | |
|     }
 | |
|     xmlAddChild((xmlNodePtr) newDoc, newRoot);
 | |
|     nodePush(ctxt, newDoc->children);
 | |
|     if (doc == NULL) {
 | |
|         ctxt->myDoc = newDoc;
 | |
|     } else {
 | |
|         ctxt->myDoc = doc;
 | |
|         newRoot->doc = doc;
 | |
|     }
 | |
| 
 | |
|     xmlDetectEncoding(ctxt);
 | |
| 
 | |
|     /*
 | |
|      * Parse a possible text declaration first
 | |
|      */
 | |
|     if ((CMP5(CUR_PTR, '<', '?', 'x', 'm', 'l')) && (IS_BLANK_CH(NXT(5)))) {
 | |
| 	xmlParseTextDecl(ctxt);
 | |
|         /*
 | |
|          * An XML-1.0 document can't reference an entity not XML-1.0
 | |
|          */
 | |
|         if ((xmlStrEqual(oldctxt->version, BAD_CAST "1.0")) &&
 | |
|             (!xmlStrEqual(ctxt->input->version, BAD_CAST "1.0"))) {
 | |
|             xmlFatalErrMsg(ctxt, XML_ERR_VERSION_MISMATCH,
 | |
|                            "Version mismatch between document and entity\n");
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     ctxt->instate = XML_PARSER_CONTENT;
 | |
|     ctxt->depth = depth;
 | |
|     if (oldctxt != NULL) {
 | |
| 	ctxt->_private = oldctxt->_private;
 | |
| 	ctxt->loadsubset = oldctxt->loadsubset;
 | |
| 	ctxt->validate = oldctxt->validate;
 | |
| 	ctxt->valid = oldctxt->valid;
 | |
| 	ctxt->replaceEntities = oldctxt->replaceEntities;
 | |
|         if (oldctxt->validate) {
 | |
|             ctxt->vctxt.error = oldctxt->vctxt.error;
 | |
|             ctxt->vctxt.warning = oldctxt->vctxt.warning;
 | |
|             ctxt->vctxt.userData = oldctxt->vctxt.userData;
 | |
|             ctxt->vctxt.flags = oldctxt->vctxt.flags;
 | |
|         }
 | |
| 	ctxt->external = oldctxt->external;
 | |
|         if (ctxt->dict) xmlDictFree(ctxt->dict);
 | |
|         ctxt->dict = oldctxt->dict;
 | |
|         ctxt->str_xml = xmlDictLookup(ctxt->dict, BAD_CAST "xml", 3);
 | |
|         ctxt->str_xmlns = xmlDictLookup(ctxt->dict, BAD_CAST "xmlns", 5);
 | |
|         ctxt->str_xml_ns = xmlDictLookup(ctxt->dict, XML_XML_NAMESPACE, 36);
 | |
|         ctxt->dictNames = oldctxt->dictNames;
 | |
|         ctxt->attsDefault = oldctxt->attsDefault;
 | |
|         ctxt->attsSpecial = oldctxt->attsSpecial;
 | |
|         ctxt->linenumbers = oldctxt->linenumbers;
 | |
| 	ctxt->record_info = oldctxt->record_info;
 | |
| 	ctxt->node_seq.maximum = oldctxt->node_seq.maximum;
 | |
| 	ctxt->node_seq.length = oldctxt->node_seq.length;
 | |
| 	ctxt->node_seq.buffer = oldctxt->node_seq.buffer;
 | |
|     } else {
 | |
| 	/*
 | |
| 	 * Doing validity checking on chunk without context
 | |
| 	 * doesn't make sense
 | |
| 	 */
 | |
| 	ctxt->_private = NULL;
 | |
| 	ctxt->validate = 0;
 | |
| 	ctxt->external = 2;
 | |
| 	ctxt->loadsubset = 0;
 | |
|     }
 | |
| 
 | |
|     xmlParseContent(ctxt);
 | |
| 
 | |
|     if ((RAW == '<') && (NXT(1) == '/')) {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_NOT_WELL_BALANCED, NULL);
 | |
|     } else if (RAW != 0) {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_EXTRA_CONTENT, NULL);
 | |
|     }
 | |
|     if (ctxt->node != newDoc->children) {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_NOT_WELL_BALANCED, NULL);
 | |
|     }
 | |
| 
 | |
|     if (!ctxt->wellFormed) {
 | |
| 	ret = (xmlParserErrors)ctxt->errNo;
 | |
|         if (oldctxt != NULL) {
 | |
|             oldctxt->errNo = ctxt->errNo;
 | |
|             oldctxt->wellFormed = 0;
 | |
|             xmlCopyError(&ctxt->lastError, &oldctxt->lastError);
 | |
|         }
 | |
|     } else {
 | |
| 	if (list != NULL) {
 | |
| 	    xmlNodePtr cur;
 | |
| 
 | |
| 	    /*
 | |
| 	     * Return the newly created nodeset after unlinking it from
 | |
| 	     * they pseudo parent.
 | |
| 	     */
 | |
| 	    cur = newDoc->children->children;
 | |
| 	    *list = cur;
 | |
| 	    while (cur != NULL) {
 | |
| 		cur->parent = NULL;
 | |
| 		cur = cur->next;
 | |
| 	    }
 | |
|             newDoc->children->children = NULL;
 | |
| 	}
 | |
| 	ret = XML_ERR_OK;
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * Also record the size of the entity parsed
 | |
|      */
 | |
|     if (ctxt->input != NULL && oldctxt != NULL) {
 | |
|         unsigned long consumed = ctxt->input->consumed;
 | |
| 
 | |
|         xmlSaturatedAddSizeT(&consumed, ctxt->input->cur - ctxt->input->base);
 | |
| 
 | |
|         xmlSaturatedAdd(&oldctxt->sizeentities, consumed);
 | |
|         xmlSaturatedAdd(&oldctxt->sizeentities, ctxt->sizeentities);
 | |
| 
 | |
|         xmlSaturatedAdd(&oldctxt->sizeentcopy, consumed);
 | |
|         xmlSaturatedAdd(&oldctxt->sizeentcopy, ctxt->sizeentcopy);
 | |
|     }
 | |
| 
 | |
|     if (oldctxt != NULL) {
 | |
|         ctxt->dict = NULL;
 | |
|         ctxt->attsDefault = NULL;
 | |
|         ctxt->attsSpecial = NULL;
 | |
|         oldctxt->nbErrors = ctxt->nbErrors;
 | |
|         oldctxt->nbWarnings = ctxt->nbWarnings;
 | |
|         oldctxt->validate = ctxt->validate;
 | |
|         oldctxt->valid = ctxt->valid;
 | |
|         oldctxt->node_seq.maximum = ctxt->node_seq.maximum;
 | |
|         oldctxt->node_seq.length = ctxt->node_seq.length;
 | |
|         oldctxt->node_seq.buffer = ctxt->node_seq.buffer;
 | |
|     }
 | |
|     ctxt->node_seq.maximum = 0;
 | |
|     ctxt->node_seq.length = 0;
 | |
|     ctxt->node_seq.buffer = NULL;
 | |
|     xmlFreeParserCtxt(ctxt);
 | |
|     newDoc->intSubset = NULL;
 | |
|     newDoc->extSubset = NULL;
 | |
|     xmlFreeDoc(newDoc);
 | |
| 
 | |
|     return(ret);
 | |
| }
 | |
| 
 | |
| #ifdef LIBXML_SAX1_ENABLED
 | |
| /**
 | |
|  * xmlParseExternalEntity:
 | |
|  * @doc:  the document the chunk pertains to
 | |
|  * @sax:  the SAX handler block (possibly NULL)
 | |
|  * @user_data:  The user data returned on SAX callbacks (possibly NULL)
 | |
|  * @depth:  Used for loop detection, use 0
 | |
|  * @URL:  the URL for the entity to load
 | |
|  * @ID:  the System ID for the entity to load
 | |
|  * @lst:  the return value for the set of parsed nodes
 | |
|  *
 | |
|  * Parse an external general entity
 | |
|  * An external general parsed entity is well-formed if it matches the
 | |
|  * production labeled extParsedEnt.
 | |
|  *
 | |
|  * [78] extParsedEnt ::= TextDecl? content
 | |
|  *
 | |
|  * Returns 0 if the entity is well formed, -1 in case of args problem and
 | |
|  *    the parser error code otherwise
 | |
|  */
 | |
| 
 | |
| int
 | |
| xmlParseExternalEntity(xmlDocPtr doc, xmlSAXHandlerPtr sax, void *user_data,
 | |
| 	  int depth, const xmlChar *URL, const xmlChar *ID, xmlNodePtr *lst) {
 | |
|     return(xmlParseExternalEntityPrivate(doc, NULL, sax, user_data, depth, URL,
 | |
| 		                       ID, lst));
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseBalancedChunkMemory:
 | |
|  * @doc:  the document the chunk pertains to (must not be NULL)
 | |
|  * @sax:  the SAX handler block (possibly NULL)
 | |
|  * @user_data:  The user data returned on SAX callbacks (possibly NULL)
 | |
|  * @depth:  Used for loop detection, use 0
 | |
|  * @string:  the input string in UTF8 or ISO-Latin (zero terminated)
 | |
|  * @lst:  the return value for the set of parsed nodes
 | |
|  *
 | |
|  * Parse a well-balanced chunk of an XML document
 | |
|  * called by the parser
 | |
|  * The allowed sequence for the Well Balanced Chunk is the one defined by
 | |
|  * the content production in the XML grammar:
 | |
|  *
 | |
|  * [43] content ::= (element | CharData | Reference | CDSect | PI | Comment)*
 | |
|  *
 | |
|  * Returns 0 if the chunk is well balanced, -1 in case of args problem and
 | |
|  *    the parser error code otherwise
 | |
|  */
 | |
| 
 | |
| int
 | |
| xmlParseBalancedChunkMemory(xmlDocPtr doc, xmlSAXHandlerPtr sax,
 | |
|      void *user_data, int depth, const xmlChar *string, xmlNodePtr *lst) {
 | |
|     return xmlParseBalancedChunkMemoryRecover( doc, sax, user_data,
 | |
|                                                 depth, string, lst, 0 );
 | |
| }
 | |
| #endif /* LIBXML_SAX1_ENABLED */
 | |
| 
 | |
| /**
 | |
|  * xmlParseBalancedChunkMemoryInternal:
 | |
|  * @oldctxt:  the existing parsing context
 | |
|  * @string:  the input string in UTF8 or ISO-Latin (zero terminated)
 | |
|  * @user_data:  the user data field for the parser context
 | |
|  * @lst:  the return value for the set of parsed nodes
 | |
|  *
 | |
|  *
 | |
|  * Parse a well-balanced chunk of an XML document
 | |
|  * called by the parser
 | |
|  * The allowed sequence for the Well Balanced Chunk is the one defined by
 | |
|  * the content production in the XML grammar:
 | |
|  *
 | |
|  * [43] content ::= (element | CharData | Reference | CDSect | PI | Comment)*
 | |
|  *
 | |
|  * Returns XML_ERR_OK if the chunk is well balanced, and the parser
 | |
|  * error code otherwise
 | |
|  *
 | |
|  * In case recover is set to 1, the nodelist will not be empty even if
 | |
|  * the parsed chunk is not well balanced.
 | |
|  */
 | |
| static xmlParserErrors
 | |
| xmlParseBalancedChunkMemoryInternal(xmlParserCtxtPtr oldctxt,
 | |
| 	const xmlChar *string, void *user_data, xmlNodePtr *lst) {
 | |
|     xmlParserCtxtPtr ctxt;
 | |
|     xmlDocPtr newDoc = NULL;
 | |
|     xmlNodePtr newRoot;
 | |
|     xmlSAXHandlerPtr oldsax = NULL;
 | |
|     xmlNodePtr content = NULL;
 | |
|     xmlNodePtr last = NULL;
 | |
|     xmlParserErrors ret = XML_ERR_OK;
 | |
| #if 0
 | |
|     unsigned i;
 | |
| #endif
 | |
| 
 | |
|     if (((oldctxt->depth > 40) && ((oldctxt->options & XML_PARSE_HUGE) == 0)) ||
 | |
|         (oldctxt->depth >  100)) {
 | |
| 	xmlFatalErrMsg(oldctxt, XML_ERR_ENTITY_LOOP,
 | |
|                        "Maximum entity nesting depth exceeded");
 | |
| 	return(XML_ERR_ENTITY_LOOP);
 | |
|     }
 | |
| 
 | |
| 
 | |
|     if (lst != NULL)
 | |
|         *lst = NULL;
 | |
|     if (string == NULL)
 | |
|         return(XML_ERR_INTERNAL_ERROR);
 | |
| 
 | |
|     ctxt = xmlCreateDocParserCtxt(string);
 | |
|     if (ctxt == NULL) return(XML_WAR_UNDECLARED_ENTITY);
 | |
|     ctxt->nbErrors = oldctxt->nbErrors;
 | |
|     ctxt->nbWarnings = oldctxt->nbWarnings;
 | |
|     if (user_data != NULL)
 | |
| 	ctxt->userData = user_data;
 | |
|     else
 | |
| 	ctxt->userData = ctxt;
 | |
|     if (ctxt->dict != NULL) xmlDictFree(ctxt->dict);
 | |
|     ctxt->dict = oldctxt->dict;
 | |
|     ctxt->input_id = oldctxt->input_id;
 | |
|     ctxt->str_xml = xmlDictLookup(ctxt->dict, BAD_CAST "xml", 3);
 | |
|     ctxt->str_xmlns = xmlDictLookup(ctxt->dict, BAD_CAST "xmlns", 5);
 | |
|     ctxt->str_xml_ns = xmlDictLookup(ctxt->dict, XML_XML_NAMESPACE, 36);
 | |
| 
 | |
|     /*
 | |
|      * Propagate namespaces down the entity
 | |
|      *
 | |
|      * This is disabled for now. The pre-2.12 code was already broken
 | |
|      * since the SAX handler was using xmlSearchNs which didn't see the
 | |
|      * namespaces added here.
 | |
|      *
 | |
|      * Making entities and namespaces work correctly requires additional
 | |
|      * changes, see xmlParseReference.
 | |
|      */
 | |
| #if 0
 | |
|     for (i = 0; i < oldctxt->nsdb->hashSize; i++) {
 | |
|         xmlParserNsBucket *bucket = &oldctxt->nsdb->hash[i];
 | |
|         xmlHashedString hprefix, huri;
 | |
|         const xmlChar **ns;
 | |
|         xmlParserNsExtra *extra;
 | |
|         unsigned nsIndex;
 | |
| 
 | |
|         if ((bucket->hashValue != 0) &&
 | |
|             (bucket->index != INT_MAX)) {
 | |
|             nsIndex = bucket->index;
 | |
|             ns = &oldctxt->nsTab[nsIndex * 2];
 | |
|             extra = &oldctxt->nsdb->extra[nsIndex];
 | |
| 
 | |
|             hprefix.name = ns[0];
 | |
|             hprefix.hashValue = bucket->hashValue;
 | |
|             huri.name = ns[1];
 | |
|             huri.hashValue = extra->uriHashValue;
 | |
|             xmlParserNsPush(ctxt, &hprefix, &huri, extra->saxData, 0);
 | |
|         }
 | |
|     }
 | |
| #endif
 | |
| 
 | |
|     oldsax = ctxt->sax;
 | |
|     ctxt->sax = oldctxt->sax;
 | |
|     xmlDetectSAX2(ctxt);
 | |
|     ctxt->replaceEntities = oldctxt->replaceEntities;
 | |
|     ctxt->options = oldctxt->options;
 | |
| 
 | |
|     ctxt->_private = oldctxt->_private;
 | |
|     if (oldctxt->myDoc == NULL) {
 | |
| 	newDoc = xmlNewDoc(BAD_CAST "1.0");
 | |
| 	if (newDoc == NULL) {
 | |
|             ret = XML_ERR_INTERNAL_ERROR;
 | |
|             goto error;
 | |
| 	}
 | |
| 	newDoc->properties = XML_DOC_INTERNAL;
 | |
| 	newDoc->dict = ctxt->dict;
 | |
| 	xmlDictReference(newDoc->dict);
 | |
| 	ctxt->myDoc = newDoc;
 | |
|     } else {
 | |
| 	ctxt->myDoc = oldctxt->myDoc;
 | |
|         content = ctxt->myDoc->children;
 | |
| 	last = ctxt->myDoc->last;
 | |
|     }
 | |
|     newRoot = xmlNewDocNode(ctxt->myDoc, NULL, BAD_CAST "pseudoroot", NULL);
 | |
|     if (newRoot == NULL) {
 | |
|         ret = XML_ERR_INTERNAL_ERROR;
 | |
|         goto error;
 | |
|     }
 | |
|     ctxt->myDoc->children = NULL;
 | |
|     ctxt->myDoc->last = NULL;
 | |
|     xmlAddChild((xmlNodePtr) ctxt->myDoc, newRoot);
 | |
|     nodePush(ctxt, ctxt->myDoc->children);
 | |
|     ctxt->instate = XML_PARSER_CONTENT;
 | |
|     ctxt->depth = oldctxt->depth;
 | |
| 
 | |
|     ctxt->validate = 0;
 | |
|     ctxt->loadsubset = oldctxt->loadsubset;
 | |
|     if ((oldctxt->validate) || (oldctxt->replaceEntities != 0)) {
 | |
| 	/*
 | |
| 	 * ID/IDREF registration will be done in xmlValidateElement below
 | |
| 	 */
 | |
| 	ctxt->loadsubset |= XML_SKIP_IDS;
 | |
|     }
 | |
|     ctxt->dictNames = oldctxt->dictNames;
 | |
|     ctxt->attsDefault = oldctxt->attsDefault;
 | |
|     ctxt->attsSpecial = oldctxt->attsSpecial;
 | |
| 
 | |
|     xmlParseContent(ctxt);
 | |
|     if ((RAW == '<') && (NXT(1) == '/')) {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_NOT_WELL_BALANCED, NULL);
 | |
|     } else if (RAW != 0) {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_EXTRA_CONTENT, NULL);
 | |
|     }
 | |
|     if (ctxt->node != ctxt->myDoc->children) {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_NOT_WELL_BALANCED, NULL);
 | |
|     }
 | |
| 
 | |
|     if (!ctxt->wellFormed) {
 | |
| 	ret = (xmlParserErrors)ctxt->errNo;
 | |
|         oldctxt->errNo = ctxt->errNo;
 | |
|         oldctxt->wellFormed = 0;
 | |
|         xmlCopyError(&ctxt->lastError, &oldctxt->lastError);
 | |
|     } else {
 | |
|         ret = XML_ERR_OK;
 | |
|     }
 | |
| 
 | |
|     if ((lst != NULL) && (ret == XML_ERR_OK)) {
 | |
| 	xmlNodePtr cur;
 | |
| 
 | |
| 	/*
 | |
| 	 * Return the newly created nodeset after unlinking it from
 | |
| 	 * they pseudo parent.
 | |
| 	 */
 | |
| 	cur = ctxt->myDoc->children->children;
 | |
| 	*lst = cur;
 | |
| 	while (cur != NULL) {
 | |
| #ifdef LIBXML_VALID_ENABLED
 | |
| 	    if ((oldctxt->validate) && (oldctxt->wellFormed) &&
 | |
| 		(oldctxt->myDoc) && (oldctxt->myDoc->intSubset) &&
 | |
| 		(cur->type == XML_ELEMENT_NODE)) {
 | |
| 		oldctxt->valid &= xmlValidateElement(&oldctxt->vctxt,
 | |
| 			oldctxt->myDoc, cur);
 | |
| 	    }
 | |
| #endif /* LIBXML_VALID_ENABLED */
 | |
| 	    cur->parent = NULL;
 | |
| 	    cur = cur->next;
 | |
| 	}
 | |
| 	ctxt->myDoc->children->children = NULL;
 | |
|     }
 | |
|     if (ctxt->myDoc != NULL) {
 | |
| 	xmlFreeNode(ctxt->myDoc->children);
 | |
|         ctxt->myDoc->children = content;
 | |
|         ctxt->myDoc->last = last;
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * Also record the size of the entity parsed
 | |
|      */
 | |
|     if (ctxt->input != NULL && oldctxt != NULL) {
 | |
|         unsigned long consumed = ctxt->input->consumed;
 | |
| 
 | |
|         xmlSaturatedAddSizeT(&consumed, ctxt->input->cur - ctxt->input->base);
 | |
| 
 | |
|         xmlSaturatedAdd(&oldctxt->sizeentcopy, consumed);
 | |
|         xmlSaturatedAdd(&oldctxt->sizeentcopy, ctxt->sizeentcopy);
 | |
|     }
 | |
| 
 | |
|     oldctxt->nbErrors = ctxt->nbErrors;
 | |
|     oldctxt->nbWarnings = ctxt->nbWarnings;
 | |
| 
 | |
| error:
 | |
|     ctxt->sax = oldsax;
 | |
|     ctxt->dict = NULL;
 | |
|     ctxt->attsDefault = NULL;
 | |
|     ctxt->attsSpecial = NULL;
 | |
|     xmlFreeParserCtxt(ctxt);
 | |
|     if (newDoc != NULL) {
 | |
| 	xmlFreeDoc(newDoc);
 | |
|     }
 | |
| 
 | |
|     return(ret);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseInNodeContext:
 | |
|  * @node:  the context node
 | |
|  * @data:  the input string
 | |
|  * @datalen:  the input string length in bytes
 | |
|  * @options:  a combination of xmlParserOption
 | |
|  * @lst:  the return value for the set of parsed nodes
 | |
|  *
 | |
|  * Parse a well-balanced chunk of an XML document
 | |
|  * within the context (DTD, namespaces, etc ...) of the given node.
 | |
|  *
 | |
|  * The allowed sequence for the data is a Well Balanced Chunk defined by
 | |
|  * the content production in the XML grammar:
 | |
|  *
 | |
|  * [43] content ::= (element | CharData | Reference | CDSect | PI | Comment)*
 | |
|  *
 | |
|  * Returns XML_ERR_OK if the chunk is well balanced, and the parser
 | |
|  * error code otherwise
 | |
|  */
 | |
| xmlParserErrors
 | |
| xmlParseInNodeContext(xmlNodePtr node, const char *data, int datalen,
 | |
|                       int options, xmlNodePtr *lst) {
 | |
|     xmlParserCtxtPtr ctxt;
 | |
|     xmlDocPtr doc = NULL;
 | |
|     xmlNodePtr fake, cur;
 | |
|     int nsnr = 0;
 | |
| 
 | |
|     xmlParserErrors ret = XML_ERR_OK;
 | |
| 
 | |
|     /*
 | |
|      * check all input parameters, grab the document
 | |
|      */
 | |
|     if ((lst == NULL) || (node == NULL) || (data == NULL) || (datalen < 0))
 | |
|         return(XML_ERR_INTERNAL_ERROR);
 | |
|     switch (node->type) {
 | |
|         case XML_ELEMENT_NODE:
 | |
|         case XML_ATTRIBUTE_NODE:
 | |
|         case XML_TEXT_NODE:
 | |
|         case XML_CDATA_SECTION_NODE:
 | |
|         case XML_ENTITY_REF_NODE:
 | |
|         case XML_PI_NODE:
 | |
|         case XML_COMMENT_NODE:
 | |
|         case XML_DOCUMENT_NODE:
 | |
|         case XML_HTML_DOCUMENT_NODE:
 | |
| 	    break;
 | |
| 	default:
 | |
| 	    return(XML_ERR_INTERNAL_ERROR);
 | |
| 
 | |
|     }
 | |
|     while ((node != NULL) && (node->type != XML_ELEMENT_NODE) &&
 | |
|            (node->type != XML_DOCUMENT_NODE) &&
 | |
| 	   (node->type != XML_HTML_DOCUMENT_NODE))
 | |
| 	node = node->parent;
 | |
|     if (node == NULL)
 | |
| 	return(XML_ERR_INTERNAL_ERROR);
 | |
|     if (node->type == XML_ELEMENT_NODE)
 | |
| 	doc = node->doc;
 | |
|     else
 | |
|         doc = (xmlDocPtr) node;
 | |
|     if (doc == NULL)
 | |
| 	return(XML_ERR_INTERNAL_ERROR);
 | |
| 
 | |
|     /*
 | |
|      * allocate a context and set-up everything not related to the
 | |
|      * node position in the tree
 | |
|      */
 | |
|     if (doc->type == XML_DOCUMENT_NODE)
 | |
| 	ctxt = xmlCreateMemoryParserCtxt((char *) data, datalen);
 | |
| #ifdef LIBXML_HTML_ENABLED
 | |
|     else if (doc->type == XML_HTML_DOCUMENT_NODE) {
 | |
| 	ctxt = htmlCreateMemoryParserCtxt((char *) data, datalen);
 | |
|         /*
 | |
|          * When parsing in context, it makes no sense to add implied
 | |
|          * elements like html/body/etc...
 | |
|          */
 | |
|         options |= HTML_PARSE_NOIMPLIED;
 | |
|     }
 | |
| #endif
 | |
|     else
 | |
|         return(XML_ERR_INTERNAL_ERROR);
 | |
| 
 | |
|     if (ctxt == NULL)
 | |
|         return(XML_ERR_NO_MEMORY);
 | |
| 
 | |
|     /*
 | |
|      * Use input doc's dict if present, else assure XML_PARSE_NODICT is set.
 | |
|      * We need a dictionary for xmlDetectSAX2, so if there's no doc dict
 | |
|      * we must wait until the last moment to free the original one.
 | |
|      */
 | |
|     if (doc->dict != NULL) {
 | |
|         if (ctxt->dict != NULL)
 | |
| 	    xmlDictFree(ctxt->dict);
 | |
| 	ctxt->dict = doc->dict;
 | |
|     } else
 | |
|         options |= XML_PARSE_NODICT;
 | |
| 
 | |
|     if (doc->encoding != NULL) {
 | |
|         xmlCharEncodingHandlerPtr hdlr;
 | |
| 
 | |
|         hdlr = xmlFindCharEncodingHandler((const char *) doc->encoding);
 | |
|         if (hdlr != NULL) {
 | |
|             xmlSwitchToEncoding(ctxt, hdlr);
 | |
| 	} else {
 | |
|             return(XML_ERR_UNSUPPORTED_ENCODING);
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     xmlCtxtUseOptionsInternal(ctxt, options, NULL);
 | |
|     xmlDetectSAX2(ctxt);
 | |
|     ctxt->myDoc = doc;
 | |
|     /* parsing in context, i.e. as within existing content */
 | |
|     ctxt->input_id = 2;
 | |
|     ctxt->instate = XML_PARSER_CONTENT;
 | |
| 
 | |
|     fake = xmlNewDocComment(node->doc, NULL);
 | |
|     if (fake == NULL) {
 | |
|         xmlFreeParserCtxt(ctxt);
 | |
| 	return(XML_ERR_NO_MEMORY);
 | |
|     }
 | |
|     xmlAddChild(node, fake);
 | |
| 
 | |
|     if (node->type == XML_ELEMENT_NODE) {
 | |
| 	nodePush(ctxt, node);
 | |
| 	/*
 | |
| 	 * initialize the SAX2 namespaces stack
 | |
| 	 */
 | |
| 	cur = node;
 | |
| 	while ((cur != NULL) && (cur->type == XML_ELEMENT_NODE)) {
 | |
| 	    xmlNsPtr ns = cur->nsDef;
 | |
|             xmlHashedString hprefix, huri;
 | |
| 
 | |
| 	    while (ns != NULL) {
 | |
|                 hprefix = xmlDictLookupHashed(ctxt->dict, ns->prefix, -1);
 | |
|                 huri = xmlDictLookupHashed(ctxt->dict, ns->href, -1);
 | |
|                 if (xmlParserNsPush(ctxt, &hprefix, &huri, ns, 1) > 0)
 | |
|                     nsnr++;
 | |
| 		ns = ns->next;
 | |
| 	    }
 | |
| 	    cur = cur->parent;
 | |
| 	}
 | |
|     }
 | |
| 
 | |
|     if ((ctxt->validate) || (ctxt->replaceEntities != 0)) {
 | |
| 	/*
 | |
| 	 * ID/IDREF registration will be done in xmlValidateElement below
 | |
| 	 */
 | |
| 	ctxt->loadsubset |= XML_SKIP_IDS;
 | |
|     }
 | |
| 
 | |
| #ifdef LIBXML_HTML_ENABLED
 | |
|     if (doc->type == XML_HTML_DOCUMENT_NODE)
 | |
|         __htmlParseContent(ctxt);
 | |
|     else
 | |
| #endif
 | |
| 	xmlParseContent(ctxt);
 | |
| 
 | |
|     xmlParserNsPop(ctxt, nsnr);
 | |
|     if ((RAW == '<') && (NXT(1) == '/')) {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_NOT_WELL_BALANCED, NULL);
 | |
|     } else if (RAW != 0) {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_EXTRA_CONTENT, NULL);
 | |
|     }
 | |
|     if ((ctxt->node != NULL) && (ctxt->node != node)) {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_NOT_WELL_BALANCED, NULL);
 | |
| 	ctxt->wellFormed = 0;
 | |
|     }
 | |
| 
 | |
|     if (!ctxt->wellFormed) {
 | |
|         if (ctxt->errNo == 0)
 | |
| 	    ret = XML_ERR_INTERNAL_ERROR;
 | |
| 	else
 | |
| 	    ret = (xmlParserErrors)ctxt->errNo;
 | |
|     } else {
 | |
|         ret = XML_ERR_OK;
 | |
|     }
 | |
| 
 | |
|     /*
 | |
|      * Return the newly created nodeset after unlinking it from
 | |
|      * the pseudo sibling.
 | |
|      */
 | |
| 
 | |
|     cur = fake->next;
 | |
|     fake->next = NULL;
 | |
|     node->last = fake;
 | |
| 
 | |
|     if (cur != NULL) {
 | |
| 	cur->prev = NULL;
 | |
|     }
 | |
| 
 | |
|     *lst = cur;
 | |
| 
 | |
|     while (cur != NULL) {
 | |
| 	cur->parent = NULL;
 | |
| 	cur = cur->next;
 | |
|     }
 | |
| 
 | |
|     xmlUnlinkNode(fake);
 | |
|     xmlFreeNode(fake);
 | |
| 
 | |
| 
 | |
|     if (ret != XML_ERR_OK) {
 | |
|         xmlFreeNodeList(*lst);
 | |
| 	*lst = NULL;
 | |
|     }
 | |
| 
 | |
|     if (doc->dict != NULL)
 | |
|         ctxt->dict = NULL;
 | |
|     xmlFreeParserCtxt(ctxt);
 | |
| 
 | |
|     return(ret);
 | |
| }
 | |
| 
 | |
| #ifdef LIBXML_SAX1_ENABLED
 | |
| /**
 | |
|  * xmlParseBalancedChunkMemoryRecover:
 | |
|  * @doc:  the document the chunk pertains to (must not be NULL)
 | |
|  * @sax:  the SAX handler block (possibly NULL)
 | |
|  * @user_data:  The user data returned on SAX callbacks (possibly NULL)
 | |
|  * @depth:  Used for loop detection, use 0
 | |
|  * @string:  the input string in UTF8 or ISO-Latin (zero terminated)
 | |
|  * @lst:  the return value for the set of parsed nodes
 | |
|  * @recover: return nodes even if the data is broken (use 0)
 | |
|  *
 | |
|  *
 | |
|  * Parse a well-balanced chunk of an XML document
 | |
|  * called by the parser
 | |
|  * The allowed sequence for the Well Balanced Chunk is the one defined by
 | |
|  * the content production in the XML grammar:
 | |
|  *
 | |
|  * [43] content ::= (element | CharData | Reference | CDSect | PI | Comment)*
 | |
|  *
 | |
|  * Returns 0 if the chunk is well balanced, -1 in case of args problem and
 | |
|  *    the parser error code otherwise
 | |
|  *
 | |
|  * In case recover is set to 1, the nodelist will not be empty even if
 | |
|  * the parsed chunk is not well balanced, assuming the parsing succeeded to
 | |
|  * some extent.
 | |
|  */
 | |
| int
 | |
| xmlParseBalancedChunkMemoryRecover(xmlDocPtr doc, xmlSAXHandlerPtr sax,
 | |
|      void *user_data, int depth, const xmlChar *string, xmlNodePtr *lst,
 | |
|      int recover) {
 | |
|     xmlParserCtxtPtr ctxt;
 | |
|     xmlDocPtr newDoc;
 | |
|     xmlSAXHandlerPtr oldsax = NULL;
 | |
|     xmlNodePtr content, newRoot;
 | |
|     int ret = 0;
 | |
| 
 | |
|     if (depth > 40) {
 | |
| 	return(XML_ERR_ENTITY_LOOP);
 | |
|     }
 | |
| 
 | |
| 
 | |
|     if (lst != NULL)
 | |
|         *lst = NULL;
 | |
|     if (string == NULL)
 | |
|         return(-1);
 | |
| 
 | |
|     ctxt = xmlCreateDocParserCtxt(string);
 | |
|     if (ctxt == NULL) return(-1);
 | |
|     ctxt->userData = ctxt;
 | |
|     if (sax != NULL) {
 | |
| 	oldsax = ctxt->sax;
 | |
|         ctxt->sax = sax;
 | |
| 	if (user_data != NULL)
 | |
| 	    ctxt->userData = user_data;
 | |
|     }
 | |
|     newDoc = xmlNewDoc(BAD_CAST "1.0");
 | |
|     if (newDoc == NULL) {
 | |
| 	xmlFreeParserCtxt(ctxt);
 | |
| 	return(-1);
 | |
|     }
 | |
|     newDoc->properties = XML_DOC_INTERNAL;
 | |
|     if ((doc != NULL) && (doc->dict != NULL)) {
 | |
|         xmlDictFree(ctxt->dict);
 | |
| 	ctxt->dict = doc->dict;
 | |
| 	xmlDictReference(ctxt->dict);
 | |
| 	ctxt->str_xml = xmlDictLookup(ctxt->dict, BAD_CAST "xml", 3);
 | |
| 	ctxt->str_xmlns = xmlDictLookup(ctxt->dict, BAD_CAST "xmlns", 5);
 | |
| 	ctxt->str_xml_ns = xmlDictLookup(ctxt->dict, XML_XML_NAMESPACE, 36);
 | |
| 	ctxt->dictNames = 1;
 | |
|     } else {
 | |
| 	xmlCtxtUseOptionsInternal(ctxt, XML_PARSE_NODICT, NULL);
 | |
|     }
 | |
|     /* doc == NULL is only supported for historic reasons */
 | |
|     if (doc != NULL) {
 | |
| 	newDoc->intSubset = doc->intSubset;
 | |
| 	newDoc->extSubset = doc->extSubset;
 | |
|     }
 | |
|     newRoot = xmlNewDocNode(newDoc, NULL, BAD_CAST "pseudoroot", NULL);
 | |
|     if (newRoot == NULL) {
 | |
| 	if (sax != NULL)
 | |
| 	    ctxt->sax = oldsax;
 | |
| 	xmlFreeParserCtxt(ctxt);
 | |
| 	newDoc->intSubset = NULL;
 | |
| 	newDoc->extSubset = NULL;
 | |
|         xmlFreeDoc(newDoc);
 | |
| 	return(-1);
 | |
|     }
 | |
|     xmlAddChild((xmlNodePtr) newDoc, newRoot);
 | |
|     nodePush(ctxt, newRoot);
 | |
|     /* doc == NULL is only supported for historic reasons */
 | |
|     if (doc == NULL) {
 | |
| 	ctxt->myDoc = newDoc;
 | |
|     } else {
 | |
| 	ctxt->myDoc = newDoc;
 | |
| 	newDoc->children->doc = doc;
 | |
| 	/* Ensure that doc has XML spec namespace */
 | |
| 	xmlSearchNsByHref(doc, (xmlNodePtr)doc, XML_XML_NAMESPACE);
 | |
| 	newDoc->oldNs = doc->oldNs;
 | |
|     }
 | |
|     ctxt->instate = XML_PARSER_CONTENT;
 | |
|     ctxt->input_id = 2;
 | |
|     ctxt->depth = depth;
 | |
| 
 | |
|     /*
 | |
|      * Doing validity checking on chunk doesn't make sense
 | |
|      */
 | |
|     ctxt->validate = 0;
 | |
|     ctxt->loadsubset = 0;
 | |
|     xmlDetectSAX2(ctxt);
 | |
| 
 | |
|     if ( doc != NULL ){
 | |
|         content = doc->children;
 | |
|         doc->children = NULL;
 | |
|         xmlParseContent(ctxt);
 | |
|         doc->children = content;
 | |
|     }
 | |
|     else {
 | |
|         xmlParseContent(ctxt);
 | |
|     }
 | |
|     if ((RAW == '<') && (NXT(1) == '/')) {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_NOT_WELL_BALANCED, NULL);
 | |
|     } else if (RAW != 0) {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_EXTRA_CONTENT, NULL);
 | |
|     }
 | |
|     if (ctxt->node != newDoc->children) {
 | |
| 	xmlFatalErr(ctxt, XML_ERR_NOT_WELL_BALANCED, NULL);
 | |
|     }
 | |
| 
 | |
|     if (!ctxt->wellFormed) {
 | |
|         if (ctxt->errNo == 0)
 | |
| 	    ret = 1;
 | |
| 	else
 | |
| 	    ret = ctxt->errNo;
 | |
|     } else {
 | |
|       ret = 0;
 | |
|     }
 | |
| 
 | |
|     if ((lst != NULL) && ((ret == 0) || (recover == 1))) {
 | |
| 	xmlNodePtr cur;
 | |
| 
 | |
| 	/*
 | |
| 	 * Return the newly created nodeset after unlinking it from
 | |
| 	 * they pseudo parent.
 | |
| 	 */
 | |
| 	cur = newDoc->children->children;
 | |
| 	*lst = cur;
 | |
| 	while (cur != NULL) {
 | |
| 	    xmlSetTreeDoc(cur, doc);
 | |
| 	    cur->parent = NULL;
 | |
| 	    cur = cur->next;
 | |
| 	}
 | |
| 	newDoc->children->children = NULL;
 | |
|     }
 | |
| 
 | |
|     if (sax != NULL)
 | |
| 	ctxt->sax = oldsax;
 | |
|     xmlFreeParserCtxt(ctxt);
 | |
|     newDoc->intSubset = NULL;
 | |
|     newDoc->extSubset = NULL;
 | |
|     /* This leaks the namespace list if doc == NULL */
 | |
|     newDoc->oldNs = NULL;
 | |
|     xmlFreeDoc(newDoc);
 | |
| 
 | |
|     return(ret);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlSAXParseEntity:
 | |
|  * @sax:  the SAX handler block
 | |
|  * @filename:  the filename
 | |
|  *
 | |
|  * DEPRECATED: Don't use.
 | |
|  *
 | |
|  * parse an XML external entity out of context and build a tree.
 | |
|  * It use the given SAX function block to handle the parsing callback.
 | |
|  * If sax is NULL, fallback to the default DOM tree building routines.
 | |
|  *
 | |
|  * [78] extParsedEnt ::= TextDecl? content
 | |
|  *
 | |
|  * This correspond to a "Well Balanced" chunk
 | |
|  *
 | |
|  * Returns the resulting document tree
 | |
|  */
 | |
| 
 | |
| xmlDocPtr
 | |
| xmlSAXParseEntity(xmlSAXHandlerPtr sax, const char *filename) {
 | |
|     xmlDocPtr ret;
 | |
|     xmlParserCtxtPtr ctxt;
 | |
| 
 | |
|     ctxt = xmlCreateFileParserCtxt(filename);
 | |
|     if (ctxt == NULL) {
 | |
| 	return(NULL);
 | |
|     }
 | |
|     if (sax != NULL) {
 | |
| 	if (ctxt->sax != NULL)
 | |
| 	    xmlFree(ctxt->sax);
 | |
|         ctxt->sax = sax;
 | |
|         ctxt->userData = NULL;
 | |
|     }
 | |
| 
 | |
|     xmlParseExtParsedEnt(ctxt);
 | |
| 
 | |
|     if (ctxt->wellFormed)
 | |
| 	ret = ctxt->myDoc;
 | |
|     else {
 | |
|         ret = NULL;
 | |
|         xmlFreeDoc(ctxt->myDoc);
 | |
|         ctxt->myDoc = NULL;
 | |
|     }
 | |
|     if (sax != NULL)
 | |
|         ctxt->sax = NULL;
 | |
|     xmlFreeParserCtxt(ctxt);
 | |
| 
 | |
|     return(ret);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseEntity:
 | |
|  * @filename:  the filename
 | |
|  *
 | |
|  * parse an XML external entity out of context and build a tree.
 | |
|  *
 | |
|  * [78] extParsedEnt ::= TextDecl? content
 | |
|  *
 | |
|  * This correspond to a "Well Balanced" chunk
 | |
|  *
 | |
|  * Returns the resulting document tree
 | |
|  */
 | |
| 
 | |
| xmlDocPtr
 | |
| xmlParseEntity(const char *filename) {
 | |
|     return(xmlSAXParseEntity(NULL, filename));
 | |
| }
 | |
| #endif /* LIBXML_SAX1_ENABLED */
 | |
| 
 | |
| /**
 | |
|  * xmlCreateEntityParserCtxtInternal:
 | |
|  * @URL:  the entity URL
 | |
|  * @ID:  the entity PUBLIC ID
 | |
|  * @base:  a possible base for the target URI
 | |
|  * @pctx:  parser context used to set options on new context
 | |
|  *
 | |
|  * Create a parser context for an external entity
 | |
|  * Automatic support for ZLIB/Compress compressed document is provided
 | |
|  * by default if found at compile-time.
 | |
|  *
 | |
|  * Returns the new parser context or NULL
 | |
|  */
 | |
| static xmlParserCtxtPtr
 | |
| xmlCreateEntityParserCtxtInternal(xmlSAXHandlerPtr sax, void *userData,
 | |
|         const xmlChar *URL, const xmlChar *ID, const xmlChar *base,
 | |
|         xmlParserCtxtPtr pctx) {
 | |
|     xmlParserCtxtPtr ctxt;
 | |
|     xmlParserInputPtr inputStream;
 | |
|     char *directory = NULL;
 | |
|     xmlChar *uri;
 | |
| 
 | |
|     ctxt = xmlNewSAXParserCtxt(sax, userData);
 | |
|     if (ctxt == NULL) {
 | |
| 	return(NULL);
 | |
|     }
 | |
| 
 | |
|     if (pctx != NULL) {
 | |
|         ctxt->options = pctx->options;
 | |
|         ctxt->_private = pctx->_private;
 | |
| 	ctxt->input_id = pctx->input_id;
 | |
|     }
 | |
| 
 | |
|     /* Don't read from stdin. */
 | |
|     if (xmlStrcmp(URL, BAD_CAST "-") == 0)
 | |
|         URL = BAD_CAST "./-";
 | |
| 
 | |
|     uri = xmlBuildURI(URL, base);
 | |
| 
 | |
|     if (uri == NULL) {
 | |
| 	inputStream = xmlLoadExternalEntity((char *)URL, (char *)ID, ctxt);
 | |
| 	if (inputStream == NULL) {
 | |
| 	    xmlFreeParserCtxt(ctxt);
 | |
| 	    return(NULL);
 | |
| 	}
 | |
| 
 | |
| 	inputPush(ctxt, inputStream);
 | |
| 
 | |
| 	if ((ctxt->directory == NULL) && (directory == NULL))
 | |
| 	    directory = xmlParserGetDirectory((char *)URL);
 | |
| 	if ((ctxt->directory == NULL) && (directory != NULL))
 | |
| 	    ctxt->directory = directory;
 | |
|     } else {
 | |
| 	inputStream = xmlLoadExternalEntity((char *)uri, (char *)ID, ctxt);
 | |
| 	if (inputStream == NULL) {
 | |
| 	    xmlFree(uri);
 | |
| 	    xmlFreeParserCtxt(ctxt);
 | |
| 	    return(NULL);
 | |
| 	}
 | |
| 
 | |
| 	inputPush(ctxt, inputStream);
 | |
| 
 | |
| 	if ((ctxt->directory == NULL) && (directory == NULL))
 | |
| 	    directory = xmlParserGetDirectory((char *)uri);
 | |
| 	if ((ctxt->directory == NULL) && (directory != NULL))
 | |
| 	    ctxt->directory = directory;
 | |
| 	xmlFree(uri);
 | |
|     }
 | |
|     return(ctxt);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlCreateEntityParserCtxt:
 | |
|  * @URL:  the entity URL
 | |
|  * @ID:  the entity PUBLIC ID
 | |
|  * @base:  a possible base for the target URI
 | |
|  *
 | |
|  * Create a parser context for an external entity
 | |
|  * Automatic support for ZLIB/Compress compressed document is provided
 | |
|  * by default if found at compile-time.
 | |
|  *
 | |
|  * Returns the new parser context or NULL
 | |
|  */
 | |
| xmlParserCtxtPtr
 | |
| xmlCreateEntityParserCtxt(const xmlChar *URL, const xmlChar *ID,
 | |
| 	                  const xmlChar *base) {
 | |
|     return xmlCreateEntityParserCtxtInternal(NULL, NULL, URL, ID, base, NULL);
 | |
| 
 | |
| }
 | |
| 
 | |
| /************************************************************************
 | |
|  *									*
 | |
|  *		Front ends when parsing from a file			*
 | |
|  *									*
 | |
|  ************************************************************************/
 | |
| 
 | |
| /**
 | |
|  * xmlCreateURLParserCtxt:
 | |
|  * @filename:  the filename or URL
 | |
|  * @options:  a combination of xmlParserOption
 | |
|  *
 | |
|  * Create a parser context for a file or URL content.
 | |
|  * Automatic support for ZLIB/Compress compressed document is provided
 | |
|  * by default if found at compile-time and for file accesses
 | |
|  *
 | |
|  * Returns the new parser context or NULL
 | |
|  */
 | |
| xmlParserCtxtPtr
 | |
| xmlCreateURLParserCtxt(const char *filename, int options)
 | |
| {
 | |
|     xmlParserCtxtPtr ctxt;
 | |
|     xmlParserInputPtr inputStream;
 | |
|     char *directory = NULL;
 | |
| 
 | |
|     ctxt = xmlNewParserCtxt();
 | |
|     if (ctxt == NULL) {
 | |
| 	xmlErrMemory(NULL, "cannot allocate parser context");
 | |
| 	return(NULL);
 | |
|     }
 | |
| 
 | |
|     if (options)
 | |
| 	xmlCtxtUseOptionsInternal(ctxt, options, NULL);
 | |
|     ctxt->linenumbers = 1;
 | |
| 
 | |
|     inputStream = xmlLoadExternalEntity(filename, NULL, ctxt);
 | |
|     if (inputStream == NULL) {
 | |
| 	xmlFreeParserCtxt(ctxt);
 | |
| 	return(NULL);
 | |
|     }
 | |
| 
 | |
|     inputPush(ctxt, inputStream);
 | |
|     if ((ctxt->directory == NULL) && (directory == NULL))
 | |
|         directory = xmlParserGetDirectory(filename);
 | |
|     if ((ctxt->directory == NULL) && (directory != NULL))
 | |
|         ctxt->directory = directory;
 | |
| 
 | |
|     return(ctxt);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlCreateFileParserCtxt:
 | |
|  * @filename:  the filename
 | |
|  *
 | |
|  * Create a parser context for a file content.
 | |
|  * Automatic support for ZLIB/Compress compressed document is provided
 | |
|  * by default if found at compile-time.
 | |
|  *
 | |
|  * Returns the new parser context or NULL
 | |
|  */
 | |
| xmlParserCtxtPtr
 | |
| xmlCreateFileParserCtxt(const char *filename)
 | |
| {
 | |
|     return(xmlCreateURLParserCtxt(filename, 0));
 | |
| }
 | |
| 
 | |
| #ifdef LIBXML_SAX1_ENABLED
 | |
| /**
 | |
|  * xmlSAXParseFileWithData:
 | |
|  * @sax:  the SAX handler block
 | |
|  * @filename:  the filename
 | |
|  * @recovery:  work in recovery mode, i.e. tries to read no Well Formed
 | |
|  *             documents
 | |
|  * @data:  the userdata
 | |
|  *
 | |
|  * DEPRECATED: Use xmlNewSAXParserCtxt and xmlCtxtReadFile.
 | |
|  *
 | |
|  * parse an XML file and build a tree. Automatic support for ZLIB/Compress
 | |
|  * compressed document is provided by default if found at compile-time.
 | |
|  * It use the given SAX function block to handle the parsing callback.
 | |
|  * If sax is NULL, fallback to the default DOM tree building routines.
 | |
|  *
 | |
|  * User data (void *) is stored within the parser context in the
 | |
|  * context's _private member, so it is available nearly everywhere in libxml
 | |
|  *
 | |
|  * Returns the resulting document tree
 | |
|  */
 | |
| 
 | |
| xmlDocPtr
 | |
| xmlSAXParseFileWithData(xmlSAXHandlerPtr sax, const char *filename,
 | |
|                         int recovery, void *data) {
 | |
|     xmlDocPtr ret;
 | |
|     xmlParserCtxtPtr ctxt;
 | |
| 
 | |
|     xmlInitParser();
 | |
| 
 | |
|     ctxt = xmlCreateFileParserCtxt(filename);
 | |
|     if (ctxt == NULL) {
 | |
| 	return(NULL);
 | |
|     }
 | |
|     if (sax != NULL) {
 | |
| 	if (ctxt->sax != NULL)
 | |
| 	    xmlFree(ctxt->sax);
 | |
|         ctxt->sax = sax;
 | |
|     }
 | |
|     xmlDetectSAX2(ctxt);
 | |
|     if (data!=NULL) {
 | |
| 	ctxt->_private = data;
 | |
|     }
 | |
| 
 | |
|     if (ctxt->directory == NULL)
 | |
|         ctxt->directory = xmlParserGetDirectory(filename);
 | |
| 
 | |
|     ctxt->recovery = recovery;
 | |
| 
 | |
|     xmlParseDocument(ctxt);
 | |
| 
 | |
|     if ((ctxt->wellFormed) || recovery) {
 | |
|         ret = ctxt->myDoc;
 | |
| 	if ((ret != NULL) && (ctxt->input->buf != NULL)) {
 | |
| 	    if (ctxt->input->buf->compressed > 0)
 | |
| 		ret->compression = 9;
 | |
| 	    else
 | |
| 		ret->compression = ctxt->input->buf->compressed;
 | |
| 	}
 | |
|     }
 | |
|     else {
 | |
|        ret = NULL;
 | |
|        xmlFreeDoc(ctxt->myDoc);
 | |
|        ctxt->myDoc = NULL;
 | |
|     }
 | |
|     if (sax != NULL)
 | |
|         ctxt->sax = NULL;
 | |
|     xmlFreeParserCtxt(ctxt);
 | |
| 
 | |
|     return(ret);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlSAXParseFile:
 | |
|  * @sax:  the SAX handler block
 | |
|  * @filename:  the filename
 | |
|  * @recovery:  work in recovery mode, i.e. tries to read no Well Formed
 | |
|  *             documents
 | |
|  *
 | |
|  * DEPRECATED: Use xmlNewSAXParserCtxt and xmlCtxtReadFile.
 | |
|  *
 | |
|  * parse an XML file and build a tree. Automatic support for ZLIB/Compress
 | |
|  * compressed document is provided by default if found at compile-time.
 | |
|  * It use the given SAX function block to handle the parsing callback.
 | |
|  * If sax is NULL, fallback to the default DOM tree building routines.
 | |
|  *
 | |
|  * Returns the resulting document tree
 | |
|  */
 | |
| 
 | |
| xmlDocPtr
 | |
| xmlSAXParseFile(xmlSAXHandlerPtr sax, const char *filename,
 | |
|                           int recovery) {
 | |
|     return(xmlSAXParseFileWithData(sax,filename,recovery,NULL));
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlRecoverDoc:
 | |
|  * @cur:  a pointer to an array of xmlChar
 | |
|  *
 | |
|  * DEPRECATED: Use xmlReadDoc with XML_PARSE_RECOVER.
 | |
|  *
 | |
|  * parse an XML in-memory document and build a tree.
 | |
|  * In the case the document is not Well Formed, a attempt to build a
 | |
|  * tree is tried anyway
 | |
|  *
 | |
|  * Returns the resulting document tree or NULL in case of failure
 | |
|  */
 | |
| 
 | |
| xmlDocPtr
 | |
| xmlRecoverDoc(const xmlChar *cur) {
 | |
|     return(xmlSAXParseDoc(NULL, cur, 1));
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseFile:
 | |
|  * @filename:  the filename
 | |
|  *
 | |
|  * DEPRECATED: Use xmlReadFile.
 | |
|  *
 | |
|  * parse an XML file and build a tree. Automatic support for ZLIB/Compress
 | |
|  * compressed document is provided by default if found at compile-time.
 | |
|  *
 | |
|  * Returns the resulting document tree if the file was wellformed,
 | |
|  * NULL otherwise.
 | |
|  */
 | |
| 
 | |
| xmlDocPtr
 | |
| xmlParseFile(const char *filename) {
 | |
|     return(xmlSAXParseFile(NULL, filename, 0));
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlRecoverFile:
 | |
|  * @filename:  the filename
 | |
|  *
 | |
|  * DEPRECATED: Use xmlReadFile with XML_PARSE_RECOVER.
 | |
|  *
 | |
|  * parse an XML file and build a tree. Automatic support for ZLIB/Compress
 | |
|  * compressed document is provided by default if found at compile-time.
 | |
|  * In the case the document is not Well Formed, it attempts to build
 | |
|  * a tree anyway
 | |
|  *
 | |
|  * Returns the resulting document tree or NULL in case of failure
 | |
|  */
 | |
| 
 | |
| xmlDocPtr
 | |
| xmlRecoverFile(const char *filename) {
 | |
|     return(xmlSAXParseFile(NULL, filename, 1));
 | |
| }
 | |
| 
 | |
| 
 | |
| /**
 | |
|  * xmlSetupParserForBuffer:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @buffer:  a xmlChar * buffer
 | |
|  * @filename:  a file name
 | |
|  *
 | |
|  * DEPRECATED: Don't use.
 | |
|  *
 | |
|  * Setup the parser context to parse a new buffer; Clears any prior
 | |
|  * contents from the parser context. The buffer parameter must not be
 | |
|  * NULL, but the filename parameter can be
 | |
|  */
 | |
| void
 | |
| xmlSetupParserForBuffer(xmlParserCtxtPtr ctxt, const xmlChar* buffer,
 | |
|                              const char* filename)
 | |
| {
 | |
|     xmlParserInputPtr input;
 | |
| 
 | |
|     if ((ctxt == NULL) || (buffer == NULL))
 | |
|         return;
 | |
| 
 | |
|     input = xmlNewInputStream(ctxt);
 | |
|     if (input == NULL) {
 | |
|         xmlErrMemory(NULL, "parsing new buffer: out of memory\n");
 | |
|         xmlClearParserCtxt(ctxt);
 | |
|         return;
 | |
|     }
 | |
| 
 | |
|     xmlClearParserCtxt(ctxt);
 | |
|     if (filename != NULL)
 | |
|         input->filename = (char *) xmlCanonicPath((const xmlChar *)filename);
 | |
|     input->base = buffer;
 | |
|     input->cur = buffer;
 | |
|     input->end = &buffer[xmlStrlen(buffer)];
 | |
|     inputPush(ctxt, input);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlSAXUserParseFile:
 | |
|  * @sax:  a SAX handler
 | |
|  * @user_data:  The user data returned on SAX callbacks
 | |
|  * @filename:  a file name
 | |
|  *
 | |
|  * DEPRECATED: Use xmlNewSAXParserCtxt and xmlCtxtReadFile.
 | |
|  *
 | |
|  * parse an XML file and call the given SAX handler routines.
 | |
|  * Automatic support for ZLIB/Compress compressed document is provided
 | |
|  *
 | |
|  * Returns 0 in case of success or a error number otherwise
 | |
|  */
 | |
| int
 | |
| xmlSAXUserParseFile(xmlSAXHandlerPtr sax, void *user_data,
 | |
|                     const char *filename) {
 | |
|     int ret = 0;
 | |
|     xmlParserCtxtPtr ctxt;
 | |
| 
 | |
|     ctxt = xmlCreateFileParserCtxt(filename);
 | |
|     if (ctxt == NULL) return -1;
 | |
|     if (ctxt->sax != (xmlSAXHandlerPtr) &xmlDefaultSAXHandler)
 | |
| 	xmlFree(ctxt->sax);
 | |
|     ctxt->sax = sax;
 | |
|     xmlDetectSAX2(ctxt);
 | |
| 
 | |
|     if (user_data != NULL)
 | |
| 	ctxt->userData = user_data;
 | |
| 
 | |
|     xmlParseDocument(ctxt);
 | |
| 
 | |
|     if (ctxt->wellFormed)
 | |
| 	ret = 0;
 | |
|     else {
 | |
|         if (ctxt->errNo != 0)
 | |
| 	    ret = ctxt->errNo;
 | |
| 	else
 | |
| 	    ret = -1;
 | |
|     }
 | |
|     if (sax != NULL)
 | |
| 	ctxt->sax = NULL;
 | |
|     if (ctxt->myDoc != NULL) {
 | |
|         xmlFreeDoc(ctxt->myDoc);
 | |
| 	ctxt->myDoc = NULL;
 | |
|     }
 | |
|     xmlFreeParserCtxt(ctxt);
 | |
| 
 | |
|     return ret;
 | |
| }
 | |
| #endif /* LIBXML_SAX1_ENABLED */
 | |
| 
 | |
| /************************************************************************
 | |
|  *									*
 | |
|  *		Front ends when parsing from memory			*
 | |
|  *									*
 | |
|  ************************************************************************/
 | |
| 
 | |
| /**
 | |
|  * xmlCreateMemoryParserCtxt:
 | |
|  * @buffer:  a pointer to a char array
 | |
|  * @size:  the size of the array
 | |
|  *
 | |
|  * Create a parser context for an XML in-memory document.
 | |
|  *
 | |
|  * Returns the new parser context or NULL
 | |
|  */
 | |
| xmlParserCtxtPtr
 | |
| xmlCreateMemoryParserCtxt(const char *buffer, int size) {
 | |
|     xmlParserCtxtPtr ctxt;
 | |
|     xmlParserInputPtr input;
 | |
|     xmlParserInputBufferPtr buf;
 | |
| 
 | |
|     if (buffer == NULL)
 | |
| 	return(NULL);
 | |
|     if (size <= 0)
 | |
| 	return(NULL);
 | |
| 
 | |
|     ctxt = xmlNewParserCtxt();
 | |
|     if (ctxt == NULL)
 | |
| 	return(NULL);
 | |
| 
 | |
|     buf = xmlParserInputBufferCreateMem(buffer, size, XML_CHAR_ENCODING_NONE);
 | |
|     if (buf == NULL) {
 | |
| 	xmlFreeParserCtxt(ctxt);
 | |
| 	return(NULL);
 | |
|     }
 | |
| 
 | |
|     input = xmlNewInputStream(ctxt);
 | |
|     if (input == NULL) {
 | |
| 	xmlFreeParserInputBuffer(buf);
 | |
| 	xmlFreeParserCtxt(ctxt);
 | |
| 	return(NULL);
 | |
|     }
 | |
| 
 | |
|     input->filename = NULL;
 | |
|     input->buf = buf;
 | |
|     xmlBufResetInput(input->buf->buffer, input);
 | |
| 
 | |
|     inputPush(ctxt, input);
 | |
|     return(ctxt);
 | |
| }
 | |
| 
 | |
| #ifdef LIBXML_SAX1_ENABLED
 | |
| /**
 | |
|  * xmlSAXParseMemoryWithData:
 | |
|  * @sax:  the SAX handler block
 | |
|  * @buffer:  an pointer to a char array
 | |
|  * @size:  the size of the array
 | |
|  * @recovery:  work in recovery mode, i.e. tries to read no Well Formed
 | |
|  *             documents
 | |
|  * @data:  the userdata
 | |
|  *
 | |
|  * DEPRECATED: Use xmlNewSAXParserCtxt and xmlCtxtReadMemory.
 | |
|  *
 | |
|  * parse an XML in-memory block and use the given SAX function block
 | |
|  * to handle the parsing callback. If sax is NULL, fallback to the default
 | |
|  * DOM tree building routines.
 | |
|  *
 | |
|  * User data (void *) is stored within the parser context in the
 | |
|  * context's _private member, so it is available nearly everywhere in libxml
 | |
|  *
 | |
|  * Returns the resulting document tree
 | |
|  */
 | |
| 
 | |
| xmlDocPtr
 | |
| xmlSAXParseMemoryWithData(xmlSAXHandlerPtr sax, const char *buffer,
 | |
| 	          int size, int recovery, void *data) {
 | |
|     xmlDocPtr ret;
 | |
|     xmlParserCtxtPtr ctxt;
 | |
| 
 | |
|     xmlInitParser();
 | |
| 
 | |
|     ctxt = xmlCreateMemoryParserCtxt(buffer, size);
 | |
|     if (ctxt == NULL) return(NULL);
 | |
|     if (sax != NULL) {
 | |
| 	if (ctxt->sax != NULL)
 | |
| 	    xmlFree(ctxt->sax);
 | |
|         ctxt->sax = sax;
 | |
|     }
 | |
|     xmlDetectSAX2(ctxt);
 | |
|     if (data!=NULL) {
 | |
| 	ctxt->_private=data;
 | |
|     }
 | |
| 
 | |
|     ctxt->recovery = recovery;
 | |
| 
 | |
|     xmlParseDocument(ctxt);
 | |
| 
 | |
|     if ((ctxt->wellFormed) || recovery) ret = ctxt->myDoc;
 | |
|     else {
 | |
|        ret = NULL;
 | |
|        xmlFreeDoc(ctxt->myDoc);
 | |
|        ctxt->myDoc = NULL;
 | |
|     }
 | |
|     if (sax != NULL)
 | |
| 	ctxt->sax = NULL;
 | |
|     xmlFreeParserCtxt(ctxt);
 | |
| 
 | |
|     return(ret);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlSAXParseMemory:
 | |
|  * @sax:  the SAX handler block
 | |
|  * @buffer:  an pointer to a char array
 | |
|  * @size:  the size of the array
 | |
|  * @recovery:  work in recovery mode, i.e. tries to read not Well Formed
 | |
|  *             documents
 | |
|  *
 | |
|  * DEPRECATED: Use xmlNewSAXParserCtxt and xmlCtxtReadMemory.
 | |
|  *
 | |
|  * parse an XML in-memory block and use the given SAX function block
 | |
|  * to handle the parsing callback. If sax is NULL, fallback to the default
 | |
|  * DOM tree building routines.
 | |
|  *
 | |
|  * Returns the resulting document tree
 | |
|  */
 | |
| xmlDocPtr
 | |
| xmlSAXParseMemory(xmlSAXHandlerPtr sax, const char *buffer,
 | |
| 	          int size, int recovery) {
 | |
|     return xmlSAXParseMemoryWithData(sax, buffer, size, recovery, NULL);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseMemory:
 | |
|  * @buffer:  an pointer to a char array
 | |
|  * @size:  the size of the array
 | |
|  *
 | |
|  * DEPRECATED: Use xmlReadMemory.
 | |
|  *
 | |
|  * parse an XML in-memory block and build a tree.
 | |
|  *
 | |
|  * Returns the resulting document tree
 | |
|  */
 | |
| 
 | |
| xmlDocPtr xmlParseMemory(const char *buffer, int size) {
 | |
|    return(xmlSAXParseMemory(NULL, buffer, size, 0));
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlRecoverMemory:
 | |
|  * @buffer:  an pointer to a char array
 | |
|  * @size:  the size of the array
 | |
|  *
 | |
|  * DEPRECATED: Use xmlReadMemory with XML_PARSE_RECOVER.
 | |
|  *
 | |
|  * parse an XML in-memory block and build a tree.
 | |
|  * In the case the document is not Well Formed, an attempt to
 | |
|  * build a tree is tried anyway
 | |
|  *
 | |
|  * Returns the resulting document tree or NULL in case of error
 | |
|  */
 | |
| 
 | |
| xmlDocPtr xmlRecoverMemory(const char *buffer, int size) {
 | |
|    return(xmlSAXParseMemory(NULL, buffer, size, 1));
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlSAXUserParseMemory:
 | |
|  * @sax:  a SAX handler
 | |
|  * @user_data:  The user data returned on SAX callbacks
 | |
|  * @buffer:  an in-memory XML document input
 | |
|  * @size:  the length of the XML document in bytes
 | |
|  *
 | |
|  * DEPRECATED: Use xmlNewSAXParserCtxt and xmlCtxtReadMemory.
 | |
|  *
 | |
|  * parse an XML in-memory buffer and call the given SAX handler routines.
 | |
|  *
 | |
|  * Returns 0 in case of success or a error number otherwise
 | |
|  */
 | |
| int xmlSAXUserParseMemory(xmlSAXHandlerPtr sax, void *user_data,
 | |
| 			  const char *buffer, int size) {
 | |
|     int ret = 0;
 | |
|     xmlParserCtxtPtr ctxt;
 | |
| 
 | |
|     xmlInitParser();
 | |
| 
 | |
|     ctxt = xmlCreateMemoryParserCtxt(buffer, size);
 | |
|     if (ctxt == NULL) return -1;
 | |
|     if (ctxt->sax != (xmlSAXHandlerPtr) &xmlDefaultSAXHandler)
 | |
|         xmlFree(ctxt->sax);
 | |
|     ctxt->sax = sax;
 | |
|     xmlDetectSAX2(ctxt);
 | |
| 
 | |
|     if (user_data != NULL)
 | |
| 	ctxt->userData = user_data;
 | |
| 
 | |
|     xmlParseDocument(ctxt);
 | |
| 
 | |
|     if (ctxt->wellFormed)
 | |
| 	ret = 0;
 | |
|     else {
 | |
|         if (ctxt->errNo != 0)
 | |
| 	    ret = ctxt->errNo;
 | |
| 	else
 | |
| 	    ret = -1;
 | |
|     }
 | |
|     if (sax != NULL)
 | |
|         ctxt->sax = NULL;
 | |
|     if (ctxt->myDoc != NULL) {
 | |
|         xmlFreeDoc(ctxt->myDoc);
 | |
| 	ctxt->myDoc = NULL;
 | |
|     }
 | |
|     xmlFreeParserCtxt(ctxt);
 | |
| 
 | |
|     return ret;
 | |
| }
 | |
| #endif /* LIBXML_SAX1_ENABLED */
 | |
| 
 | |
| /**
 | |
|  * xmlCreateDocParserCtxt:
 | |
|  * @str:  a pointer to an array of xmlChar
 | |
|  *
 | |
|  * Creates a parser context for an XML in-memory document.
 | |
|  *
 | |
|  * Returns the new parser context or NULL
 | |
|  */
 | |
| xmlParserCtxtPtr
 | |
| xmlCreateDocParserCtxt(const xmlChar *str) {
 | |
|     xmlParserCtxtPtr ctxt;
 | |
|     xmlParserInputPtr input;
 | |
|     xmlParserInputBufferPtr buf;
 | |
| 
 | |
|     if (str == NULL)
 | |
| 	return(NULL);
 | |
| 
 | |
|     ctxt = xmlNewParserCtxt();
 | |
|     if (ctxt == NULL)
 | |
| 	return(NULL);
 | |
| 
 | |
|     buf = xmlParserInputBufferCreateString(str);
 | |
|     if (buf == NULL) {
 | |
| 	xmlFreeParserCtxt(ctxt);
 | |
| 	return(NULL);
 | |
|     }
 | |
| 
 | |
|     input = xmlNewInputStream(ctxt);
 | |
|     if (input == NULL) {
 | |
| 	xmlFreeParserInputBuffer(buf);
 | |
| 	xmlFreeParserCtxt(ctxt);
 | |
| 	return(NULL);
 | |
|     }
 | |
| 
 | |
|     input->filename = NULL;
 | |
|     input->buf = buf;
 | |
|     xmlBufResetInput(input->buf->buffer, input);
 | |
| 
 | |
|     inputPush(ctxt, input);
 | |
|     return(ctxt);
 | |
| }
 | |
| 
 | |
| #ifdef LIBXML_SAX1_ENABLED
 | |
| /**
 | |
|  * xmlSAXParseDoc:
 | |
|  * @sax:  the SAX handler block
 | |
|  * @cur:  a pointer to an array of xmlChar
 | |
|  * @recovery:  work in recovery mode, i.e. tries to read no Well Formed
 | |
|  *             documents
 | |
|  *
 | |
|  * DEPRECATED: Use xmlNewSAXParserCtxt and xmlCtxtReadDoc.
 | |
|  *
 | |
|  * parse an XML in-memory document and build a tree.
 | |
|  * It use the given SAX function block to handle the parsing callback.
 | |
|  * If sax is NULL, fallback to the default DOM tree building routines.
 | |
|  *
 | |
|  * Returns the resulting document tree
 | |
|  */
 | |
| 
 | |
| xmlDocPtr
 | |
| xmlSAXParseDoc(xmlSAXHandlerPtr sax, const xmlChar *cur, int recovery) {
 | |
|     xmlDocPtr ret;
 | |
|     xmlParserCtxtPtr ctxt;
 | |
|     xmlSAXHandlerPtr oldsax = NULL;
 | |
| 
 | |
|     if (cur == NULL) return(NULL);
 | |
| 
 | |
| 
 | |
|     ctxt = xmlCreateDocParserCtxt(cur);
 | |
|     if (ctxt == NULL) return(NULL);
 | |
|     if (sax != NULL) {
 | |
|         oldsax = ctxt->sax;
 | |
|         ctxt->sax = sax;
 | |
|         ctxt->userData = NULL;
 | |
|     }
 | |
|     xmlDetectSAX2(ctxt);
 | |
| 
 | |
|     xmlParseDocument(ctxt);
 | |
|     if ((ctxt->wellFormed) || recovery) ret = ctxt->myDoc;
 | |
|     else {
 | |
|        ret = NULL;
 | |
|        xmlFreeDoc(ctxt->myDoc);
 | |
|        ctxt->myDoc = NULL;
 | |
|     }
 | |
|     if (sax != NULL)
 | |
| 	ctxt->sax = oldsax;
 | |
|     xmlFreeParserCtxt(ctxt);
 | |
| 
 | |
|     return(ret);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlParseDoc:
 | |
|  * @cur:  a pointer to an array of xmlChar
 | |
|  *
 | |
|  * DEPRECATED: Use xmlReadDoc.
 | |
|  *
 | |
|  * parse an XML in-memory document and build a tree.
 | |
|  *
 | |
|  * Returns the resulting document tree
 | |
|  */
 | |
| 
 | |
| xmlDocPtr
 | |
| xmlParseDoc(const xmlChar *cur) {
 | |
|     return(xmlSAXParseDoc(NULL, cur, 0));
 | |
| }
 | |
| #endif /* LIBXML_SAX1_ENABLED */
 | |
| 
 | |
| #ifdef LIBXML_LEGACY_ENABLED
 | |
| /************************************************************************
 | |
|  *									*
 | |
|  *	Specific function to keep track of entities references		*
 | |
|  *	and used by the XSLT debugger					*
 | |
|  *									*
 | |
|  ************************************************************************/
 | |
| 
 | |
| static xmlEntityReferenceFunc xmlEntityRefFunc = NULL;
 | |
| 
 | |
| /**
 | |
|  * xmlAddEntityReference:
 | |
|  * @ent : A valid entity
 | |
|  * @firstNode : A valid first node for children of entity
 | |
|  * @lastNode : A valid last node of children entity
 | |
|  *
 | |
|  * Notify of a reference to an entity of type XML_EXTERNAL_GENERAL_PARSED_ENTITY
 | |
|  */
 | |
| static void
 | |
| xmlAddEntityReference(xmlEntityPtr ent, xmlNodePtr firstNode,
 | |
|                       xmlNodePtr lastNode)
 | |
| {
 | |
|     if (xmlEntityRefFunc != NULL) {
 | |
|         (*xmlEntityRefFunc) (ent, firstNode, lastNode);
 | |
|     }
 | |
| }
 | |
| 
 | |
| 
 | |
| /**
 | |
|  * xmlSetEntityReferenceFunc:
 | |
|  * @func: A valid function
 | |
|  *
 | |
|  * Set the function to call call back when a xml reference has been made
 | |
|  */
 | |
| void
 | |
| xmlSetEntityReferenceFunc(xmlEntityReferenceFunc func)
 | |
| {
 | |
|     xmlEntityRefFunc = func;
 | |
| }
 | |
| #endif /* LIBXML_LEGACY_ENABLED */
 | |
| 
 | |
| /************************************************************************
 | |
|  *									*
 | |
|  *	New set (2.6.0) of simpler and more flexible APIs		*
 | |
|  *									*
 | |
|  ************************************************************************/
 | |
| 
 | |
| /**
 | |
|  * DICT_FREE:
 | |
|  * @str:  a string
 | |
|  *
 | |
|  * Free a string if it is not owned by the "dict" dictionary in the
 | |
|  * current scope
 | |
|  */
 | |
| #define DICT_FREE(str)						\
 | |
| 	if ((str) && ((!dict) ||				\
 | |
| 	    (xmlDictOwns(dict, (const xmlChar *)(str)) == 0)))	\
 | |
| 	    xmlFree((char *)(str));
 | |
| 
 | |
| /**
 | |
|  * xmlCtxtReset:
 | |
|  * @ctxt: an XML parser context
 | |
|  *
 | |
|  * Reset a parser context
 | |
|  */
 | |
| void
 | |
| xmlCtxtReset(xmlParserCtxtPtr ctxt)
 | |
| {
 | |
|     xmlParserInputPtr input;
 | |
|     xmlDictPtr dict;
 | |
| 
 | |
|     if (ctxt == NULL)
 | |
|         return;
 | |
| 
 | |
|     dict = ctxt->dict;
 | |
| 
 | |
|     while ((input = inputPop(ctxt)) != NULL) { /* Non consuming */
 | |
|         xmlFreeInputStream(input);
 | |
|     }
 | |
|     ctxt->inputNr = 0;
 | |
|     ctxt->input = NULL;
 | |
| 
 | |
|     ctxt->spaceNr = 0;
 | |
|     if (ctxt->spaceTab != NULL) {
 | |
| 	ctxt->spaceTab[0] = -1;
 | |
| 	ctxt->space = &ctxt->spaceTab[0];
 | |
|     } else {
 | |
|         ctxt->space = NULL;
 | |
|     }
 | |
| 
 | |
| 
 | |
|     ctxt->nodeNr = 0;
 | |
|     ctxt->node = NULL;
 | |
| 
 | |
|     ctxt->nameNr = 0;
 | |
|     ctxt->name = NULL;
 | |
| 
 | |
|     ctxt->nsNr = 0;
 | |
|     xmlParserNsReset(ctxt->nsdb);
 | |
| 
 | |
|     DICT_FREE(ctxt->version);
 | |
|     ctxt->version = NULL;
 | |
|     DICT_FREE(ctxt->encoding);
 | |
|     ctxt->encoding = NULL;
 | |
|     DICT_FREE(ctxt->directory);
 | |
|     ctxt->directory = NULL;
 | |
|     DICT_FREE(ctxt->extSubURI);
 | |
|     ctxt->extSubURI = NULL;
 | |
|     DICT_FREE(ctxt->extSubSystem);
 | |
|     ctxt->extSubSystem = NULL;
 | |
|     if (ctxt->myDoc != NULL)
 | |
|         xmlFreeDoc(ctxt->myDoc);
 | |
|     ctxt->myDoc = NULL;
 | |
| 
 | |
|     ctxt->standalone = -1;
 | |
|     ctxt->hasExternalSubset = 0;
 | |
|     ctxt->hasPErefs = 0;
 | |
|     ctxt->html = 0;
 | |
|     ctxt->external = 0;
 | |
|     ctxt->instate = XML_PARSER_START;
 | |
|     ctxt->token = 0;
 | |
| 
 | |
|     ctxt->wellFormed = 1;
 | |
|     ctxt->nsWellFormed = 1;
 | |
|     ctxt->disableSAX = 0;
 | |
|     ctxt->valid = 1;
 | |
| #if 0
 | |
|     ctxt->vctxt.userData = ctxt;
 | |
|     ctxt->vctxt.error = xmlParserValidityError;
 | |
|     ctxt->vctxt.warning = xmlParserValidityWarning;
 | |
| #endif
 | |
|     ctxt->record_info = 0;
 | |
|     ctxt->checkIndex = 0;
 | |
|     ctxt->endCheckState = 0;
 | |
|     ctxt->inSubset = 0;
 | |
|     ctxt->errNo = XML_ERR_OK;
 | |
|     ctxt->depth = 0;
 | |
|     ctxt->catalogs = NULL;
 | |
|     ctxt->sizeentities = 0;
 | |
|     ctxt->sizeentcopy = 0;
 | |
|     xmlInitNodeInfoSeq(&ctxt->node_seq);
 | |
| 
 | |
|     if (ctxt->attsDefault != NULL) {
 | |
|         xmlHashFree(ctxt->attsDefault, xmlHashDefaultDeallocator);
 | |
|         ctxt->attsDefault = NULL;
 | |
|     }
 | |
|     if (ctxt->attsSpecial != NULL) {
 | |
|         xmlHashFree(ctxt->attsSpecial, NULL);
 | |
|         ctxt->attsSpecial = NULL;
 | |
|     }
 | |
| 
 | |
| #ifdef LIBXML_CATALOG_ENABLED
 | |
|     if (ctxt->catalogs != NULL)
 | |
| 	xmlCatalogFreeLocal(ctxt->catalogs);
 | |
| #endif
 | |
|     ctxt->nbErrors = 0;
 | |
|     ctxt->nbWarnings = 0;
 | |
|     if (ctxt->lastError.code != XML_ERR_OK)
 | |
|         xmlResetError(&ctxt->lastError);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlCtxtResetPush:
 | |
|  * @ctxt: an XML parser context
 | |
|  * @chunk:  a pointer to an array of chars
 | |
|  * @size:  number of chars in the array
 | |
|  * @filename:  an optional file name or URI
 | |
|  * @encoding:  the document encoding, or NULL
 | |
|  *
 | |
|  * Reset a push parser context
 | |
|  *
 | |
|  * Returns 0 in case of success and 1 in case of error
 | |
|  */
 | |
| int
 | |
| xmlCtxtResetPush(xmlParserCtxtPtr ctxt, const char *chunk,
 | |
|                  int size, const char *filename, const char *encoding)
 | |
| {
 | |
|     xmlParserInputPtr inputStream;
 | |
|     xmlParserInputBufferPtr buf;
 | |
| 
 | |
|     if (ctxt == NULL)
 | |
|         return(1);
 | |
| 
 | |
|     buf = xmlAllocParserInputBuffer(XML_CHAR_ENCODING_NONE);
 | |
|     if (buf == NULL)
 | |
|         return(1);
 | |
| 
 | |
|     if (ctxt == NULL) {
 | |
|         xmlFreeParserInputBuffer(buf);
 | |
|         return(1);
 | |
|     }
 | |
| 
 | |
|     xmlCtxtReset(ctxt);
 | |
| 
 | |
|     if (filename == NULL) {
 | |
|         ctxt->directory = NULL;
 | |
|     } else {
 | |
|         ctxt->directory = xmlParserGetDirectory(filename);
 | |
|     }
 | |
| 
 | |
|     inputStream = xmlNewInputStream(ctxt);
 | |
|     if (inputStream == NULL) {
 | |
|         xmlFreeParserInputBuffer(buf);
 | |
|         return(1);
 | |
|     }
 | |
| 
 | |
|     if (filename == NULL)
 | |
|         inputStream->filename = NULL;
 | |
|     else
 | |
|         inputStream->filename = (char *)
 | |
|             xmlCanonicPath((const xmlChar *) filename);
 | |
|     inputStream->buf = buf;
 | |
|     xmlBufResetInput(buf->buffer, inputStream);
 | |
| 
 | |
|     inputPush(ctxt, inputStream);
 | |
| 
 | |
|     if ((size > 0) && (chunk != NULL) && (ctxt->input != NULL) &&
 | |
|         (ctxt->input->buf != NULL)) {
 | |
|         size_t pos = ctxt->input->cur - ctxt->input->base;
 | |
|         int res;
 | |
| 
 | |
|         res = xmlParserInputBufferPush(ctxt->input->buf, size, chunk);
 | |
|         xmlBufUpdateInput(ctxt->input->buf->buffer, ctxt->input, pos);
 | |
|         if (res < 0) {
 | |
|             xmlFatalErr(ctxt, ctxt->input->buf->error, NULL);
 | |
|             xmlHaltParser(ctxt);
 | |
|             return(1);
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     if (encoding != NULL) {
 | |
|         xmlCharEncodingHandlerPtr hdlr;
 | |
| 
 | |
|         hdlr = xmlFindCharEncodingHandler(encoding);
 | |
|         if (hdlr != NULL) {
 | |
|             xmlSwitchToEncoding(ctxt, hdlr);
 | |
| 	} else {
 | |
| 	    xmlFatalErrMsgStr(ctxt, XML_ERR_UNSUPPORTED_ENCODING,
 | |
| 			      "Unsupported encoding %s\n", BAD_CAST encoding);
 | |
|         }
 | |
|     }
 | |
| 
 | |
|     return(0);
 | |
| }
 | |
| 
 | |
| 
 | |
| /**
 | |
|  * xmlCtxtUseOptionsInternal:
 | |
|  * @ctxt: an XML parser context
 | |
|  * @options:  a combination of xmlParserOption
 | |
|  * @encoding:  the user provided encoding to use
 | |
|  *
 | |
|  * Applies the options to the parser context
 | |
|  *
 | |
|  * Returns 0 in case of success, the set of unknown or unimplemented options
 | |
|  *         in case of error.
 | |
|  */
 | |
| static int
 | |
| xmlCtxtUseOptionsInternal(xmlParserCtxtPtr ctxt, int options, const char *encoding)
 | |
| {
 | |
|     if (ctxt == NULL)
 | |
|         return(-1);
 | |
|     if (encoding != NULL) {
 | |
|         if (ctxt->encoding != NULL)
 | |
| 	    xmlFree((xmlChar *) ctxt->encoding);
 | |
|         ctxt->encoding = xmlStrdup((const xmlChar *) encoding);
 | |
|     }
 | |
|     if (options & XML_PARSE_RECOVER) {
 | |
|         ctxt->recovery = 1;
 | |
|         options -= XML_PARSE_RECOVER;
 | |
| 	ctxt->options |= XML_PARSE_RECOVER;
 | |
|     } else
 | |
|         ctxt->recovery = 0;
 | |
|     if (options & XML_PARSE_DTDLOAD) {
 | |
|         ctxt->loadsubset = XML_DETECT_IDS;
 | |
|         options -= XML_PARSE_DTDLOAD;
 | |
| 	ctxt->options |= XML_PARSE_DTDLOAD;
 | |
|     } else
 | |
|         ctxt->loadsubset = 0;
 | |
|     if (options & XML_PARSE_DTDATTR) {
 | |
|         ctxt->loadsubset |= XML_COMPLETE_ATTRS;
 | |
|         options -= XML_PARSE_DTDATTR;
 | |
| 	ctxt->options |= XML_PARSE_DTDATTR;
 | |
|     }
 | |
|     if (options & XML_PARSE_NOENT) {
 | |
|         ctxt->replaceEntities = 1;
 | |
|         /* ctxt->loadsubset |= XML_DETECT_IDS; */
 | |
|         options -= XML_PARSE_NOENT;
 | |
| 	ctxt->options |= XML_PARSE_NOENT;
 | |
|     } else
 | |
|         ctxt->replaceEntities = 0;
 | |
|     if (options & XML_PARSE_PEDANTIC) {
 | |
|         ctxt->pedantic = 1;
 | |
|         options -= XML_PARSE_PEDANTIC;
 | |
| 	ctxt->options |= XML_PARSE_PEDANTIC;
 | |
|     } else
 | |
|         ctxt->pedantic = 0;
 | |
|     if (options & XML_PARSE_NOBLANKS) {
 | |
|         ctxt->keepBlanks = 0;
 | |
|         ctxt->sax->ignorableWhitespace = xmlSAX2IgnorableWhitespace;
 | |
|         options -= XML_PARSE_NOBLANKS;
 | |
| 	ctxt->options |= XML_PARSE_NOBLANKS;
 | |
|     } else
 | |
|         ctxt->keepBlanks = 1;
 | |
|     if (options & XML_PARSE_DTDVALID) {
 | |
|         ctxt->validate = 1;
 | |
|         if (options & XML_PARSE_NOWARNING)
 | |
|             ctxt->vctxt.warning = NULL;
 | |
|         if (options & XML_PARSE_NOERROR)
 | |
|             ctxt->vctxt.error = NULL;
 | |
|         options -= XML_PARSE_DTDVALID;
 | |
| 	ctxt->options |= XML_PARSE_DTDVALID;
 | |
|     } else
 | |
|         ctxt->validate = 0;
 | |
|     if (options & XML_PARSE_NOWARNING) {
 | |
|         ctxt->sax->warning = NULL;
 | |
|         options -= XML_PARSE_NOWARNING;
 | |
|     }
 | |
|     if (options & XML_PARSE_NOERROR) {
 | |
|         ctxt->sax->error = NULL;
 | |
|         ctxt->sax->fatalError = NULL;
 | |
|         options -= XML_PARSE_NOERROR;
 | |
|     }
 | |
| #ifdef LIBXML_SAX1_ENABLED
 | |
|     if (options & XML_PARSE_SAX1) {
 | |
|         ctxt->sax->startElementNs = NULL;
 | |
|         ctxt->sax->endElementNs = NULL;
 | |
|         ctxt->sax->initialized = 1;
 | |
|         options -= XML_PARSE_SAX1;
 | |
| 	ctxt->options |= XML_PARSE_SAX1;
 | |
|     }
 | |
| #endif /* LIBXML_SAX1_ENABLED */
 | |
|     if (options & XML_PARSE_NODICT) {
 | |
|         ctxt->dictNames = 0;
 | |
|         options -= XML_PARSE_NODICT;
 | |
| 	ctxt->options |= XML_PARSE_NODICT;
 | |
|     } else {
 | |
|         ctxt->dictNames = 1;
 | |
|     }
 | |
|     if (options & XML_PARSE_NOCDATA) {
 | |
|         ctxt->sax->cdataBlock = NULL;
 | |
|         options -= XML_PARSE_NOCDATA;
 | |
| 	ctxt->options |= XML_PARSE_NOCDATA;
 | |
|     }
 | |
|     if (options & XML_PARSE_NSCLEAN) {
 | |
| 	ctxt->options |= XML_PARSE_NSCLEAN;
 | |
|         options -= XML_PARSE_NSCLEAN;
 | |
|     }
 | |
|     if (options & XML_PARSE_NONET) {
 | |
| 	ctxt->options |= XML_PARSE_NONET;
 | |
|         options -= XML_PARSE_NONET;
 | |
|     }
 | |
|     if (options & XML_PARSE_COMPACT) {
 | |
| 	ctxt->options |= XML_PARSE_COMPACT;
 | |
|         options -= XML_PARSE_COMPACT;
 | |
|     }
 | |
|     if (options & XML_PARSE_OLD10) {
 | |
| 	ctxt->options |= XML_PARSE_OLD10;
 | |
|         options -= XML_PARSE_OLD10;
 | |
|     }
 | |
|     if (options & XML_PARSE_NOBASEFIX) {
 | |
| 	ctxt->options |= XML_PARSE_NOBASEFIX;
 | |
|         options -= XML_PARSE_NOBASEFIX;
 | |
|     }
 | |
|     if (options & XML_PARSE_HUGE) {
 | |
| 	ctxt->options |= XML_PARSE_HUGE;
 | |
|         options -= XML_PARSE_HUGE;
 | |
|         if (ctxt->dict != NULL)
 | |
|             xmlDictSetLimit(ctxt->dict, 0);
 | |
|     }
 | |
|     if (options & XML_PARSE_OLDSAX) {
 | |
| 	ctxt->options |= XML_PARSE_OLDSAX;
 | |
|         options -= XML_PARSE_OLDSAX;
 | |
|     }
 | |
|     if (options & XML_PARSE_IGNORE_ENC) {
 | |
| 	ctxt->options |= XML_PARSE_IGNORE_ENC;
 | |
|         options -= XML_PARSE_IGNORE_ENC;
 | |
|     }
 | |
|     if (options & XML_PARSE_BIG_LINES) {
 | |
| 	ctxt->options |= XML_PARSE_BIG_LINES;
 | |
|         options -= XML_PARSE_BIG_LINES;
 | |
|     }
 | |
|     ctxt->linenumbers = 1;
 | |
|     return (options);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlCtxtUseOptions:
 | |
|  * @ctxt: an XML parser context
 | |
|  * @options:  a combination of xmlParserOption
 | |
|  *
 | |
|  * Applies the options to the parser context
 | |
|  *
 | |
|  * Returns 0 in case of success, the set of unknown or unimplemented options
 | |
|  *         in case of error.
 | |
|  */
 | |
| int
 | |
| xmlCtxtUseOptions(xmlParserCtxtPtr ctxt, int options)
 | |
| {
 | |
|    return(xmlCtxtUseOptionsInternal(ctxt, options, NULL));
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlCtxtSetMaxAmplification:
 | |
|  * @ctxt: an XML parser context
 | |
|  * @maxAmpl:  maximum amplification factor
 | |
|  *
 | |
|  * To protect against exponential entity expansion ("billion laughs"), the
 | |
|  * size of serialized output is (roughly) limited to the input size
 | |
|  * multiplied by this factor. The default value is 5.
 | |
|  *
 | |
|  * When working with documents making heavy use of entity expansion, it can
 | |
|  * be necessary to increase the value. For security reasons, this should only
 | |
|  * be considered when processing trusted input.
 | |
|  */
 | |
| void
 | |
| xmlCtxtSetMaxAmplification(xmlParserCtxtPtr ctxt, unsigned maxAmpl)
 | |
| {
 | |
|     ctxt->maxAmpl = maxAmpl;
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlDoRead:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @URL:  the base URL to use for the document
 | |
|  * @encoding:  the document encoding, or NULL
 | |
|  * @options:  a combination of xmlParserOption
 | |
|  * @reuse:  keep the context for reuse
 | |
|  *
 | |
|  * Common front-end for the xmlRead functions
 | |
|  *
 | |
|  * Returns the resulting document tree or NULL
 | |
|  */
 | |
| static xmlDocPtr
 | |
| xmlDoRead(xmlParserCtxtPtr ctxt, const char *URL, const char *encoding,
 | |
|           int options, int reuse)
 | |
| {
 | |
|     xmlDocPtr ret;
 | |
| 
 | |
|     xmlCtxtUseOptionsInternal(ctxt, options, encoding);
 | |
|     if (encoding != NULL) {
 | |
|         xmlCharEncodingHandlerPtr hdlr;
 | |
| 
 | |
|         /*
 | |
|          * TODO: We should consider to set XML_PARSE_IGNORE_ENC if the
 | |
|          * caller provided an encoding. Otherwise, we might switch to
 | |
|          * the encoding from the XML declaration which is likely to
 | |
|          * break things. Also see xmlSwitchInputEncoding.
 | |
|          */
 | |
| 	hdlr = xmlFindCharEncodingHandler(encoding);
 | |
| 	if (hdlr != NULL)
 | |
| 	    xmlSwitchToEncoding(ctxt, hdlr);
 | |
|     }
 | |
|     if ((URL != NULL) && (ctxt->input != NULL) &&
 | |
|         (ctxt->input->filename == NULL))
 | |
|         ctxt->input->filename = (char *) xmlStrdup((const xmlChar *) URL);
 | |
|     xmlParseDocument(ctxt);
 | |
|     if ((ctxt->wellFormed) || ctxt->recovery)
 | |
|         ret = ctxt->myDoc;
 | |
|     else {
 | |
|         ret = NULL;
 | |
| 	if (ctxt->myDoc != NULL) {
 | |
| 	    xmlFreeDoc(ctxt->myDoc);
 | |
| 	}
 | |
|     }
 | |
|     ctxt->myDoc = NULL;
 | |
|     if (!reuse) {
 | |
| 	xmlFreeParserCtxt(ctxt);
 | |
|     }
 | |
| 
 | |
|     return (ret);
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlReadDoc:
 | |
|  * @cur:  a pointer to a zero terminated string
 | |
|  * @URL:  the base URL to use for the document
 | |
|  * @encoding:  the document encoding, or NULL
 | |
|  * @options:  a combination of xmlParserOption
 | |
|  *
 | |
|  * parse an XML in-memory document and build a tree.
 | |
|  *
 | |
|  * Returns the resulting document tree
 | |
|  */
 | |
| xmlDocPtr
 | |
| xmlReadDoc(const xmlChar * cur, const char *URL, const char *encoding, int options)
 | |
| {
 | |
|     xmlParserCtxtPtr ctxt;
 | |
| 
 | |
|     if (cur == NULL)
 | |
|         return (NULL);
 | |
|     xmlInitParser();
 | |
| 
 | |
|     ctxt = xmlCreateDocParserCtxt(cur);
 | |
|     if (ctxt == NULL)
 | |
|         return (NULL);
 | |
|     return (xmlDoRead(ctxt, URL, encoding, options, 0));
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlReadFile:
 | |
|  * @filename:  a file or URL
 | |
|  * @encoding:  the document encoding, or NULL
 | |
|  * @options:  a combination of xmlParserOption
 | |
|  *
 | |
|  * parse an XML file from the filesystem or the network.
 | |
|  *
 | |
|  * Returns the resulting document tree
 | |
|  */
 | |
| xmlDocPtr
 | |
| xmlReadFile(const char *filename, const char *encoding, int options)
 | |
| {
 | |
|     xmlParserCtxtPtr ctxt;
 | |
| 
 | |
|     xmlInitParser();
 | |
|     ctxt = xmlCreateURLParserCtxt(filename, options);
 | |
|     if (ctxt == NULL)
 | |
|         return (NULL);
 | |
|     return (xmlDoRead(ctxt, NULL, encoding, options, 0));
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlReadMemory:
 | |
|  * @buffer:  a pointer to a char array
 | |
|  * @size:  the size of the array
 | |
|  * @URL:  the base URL to use for the document
 | |
|  * @encoding:  the document encoding, or NULL
 | |
|  * @options:  a combination of xmlParserOption
 | |
|  *
 | |
|  * parse an XML in-memory document and build a tree.
 | |
|  *
 | |
|  * Returns the resulting document tree
 | |
|  */
 | |
| xmlDocPtr
 | |
| xmlReadMemory(const char *buffer, int size, const char *URL, const char *encoding, int options)
 | |
| {
 | |
|     xmlParserCtxtPtr ctxt;
 | |
| 
 | |
|     xmlInitParser();
 | |
|     ctxt = xmlCreateMemoryParserCtxt(buffer, size);
 | |
|     if (ctxt == NULL)
 | |
|         return (NULL);
 | |
|     return (xmlDoRead(ctxt, URL, encoding, options, 0));
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlReadFd:
 | |
|  * @fd:  an open file descriptor
 | |
|  * @URL:  the base URL to use for the document
 | |
|  * @encoding:  the document encoding, or NULL
 | |
|  * @options:  a combination of xmlParserOption
 | |
|  *
 | |
|  * parse an XML from a file descriptor and build a tree.
 | |
|  * NOTE that the file descriptor will not be closed when the
 | |
|  *      reader is closed or reset.
 | |
|  *
 | |
|  * Returns the resulting document tree
 | |
|  */
 | |
| xmlDocPtr
 | |
| xmlReadFd(int fd, const char *URL, const char *encoding, int options)
 | |
| {
 | |
|     xmlParserCtxtPtr ctxt;
 | |
|     xmlParserInputBufferPtr input;
 | |
|     xmlParserInputPtr stream;
 | |
| 
 | |
|     if (fd < 0)
 | |
|         return (NULL);
 | |
|     xmlInitParser();
 | |
| 
 | |
|     input = xmlParserInputBufferCreateFd(fd, XML_CHAR_ENCODING_NONE);
 | |
|     if (input == NULL)
 | |
|         return (NULL);
 | |
|     input->closecallback = NULL;
 | |
|     ctxt = xmlNewParserCtxt();
 | |
|     if (ctxt == NULL) {
 | |
|         xmlFreeParserInputBuffer(input);
 | |
|         return (NULL);
 | |
|     }
 | |
|     stream = xmlNewIOInputStream(ctxt, input, XML_CHAR_ENCODING_NONE);
 | |
|     if (stream == NULL) {
 | |
|         xmlFreeParserInputBuffer(input);
 | |
| 	xmlFreeParserCtxt(ctxt);
 | |
|         return (NULL);
 | |
|     }
 | |
|     inputPush(ctxt, stream);
 | |
|     return (xmlDoRead(ctxt, URL, encoding, options, 0));
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlReadIO:
 | |
|  * @ioread:  an I/O read function
 | |
|  * @ioclose:  an I/O close function
 | |
|  * @ioctx:  an I/O handler
 | |
|  * @URL:  the base URL to use for the document
 | |
|  * @encoding:  the document encoding, or NULL
 | |
|  * @options:  a combination of xmlParserOption
 | |
|  *
 | |
|  * parse an XML document from I/O functions and source and build a tree.
 | |
|  *
 | |
|  * Returns the resulting document tree
 | |
|  */
 | |
| xmlDocPtr
 | |
| xmlReadIO(xmlInputReadCallback ioread, xmlInputCloseCallback ioclose,
 | |
|           void *ioctx, const char *URL, const char *encoding, int options)
 | |
| {
 | |
|     xmlParserCtxtPtr ctxt;
 | |
|     xmlParserInputBufferPtr input;
 | |
|     xmlParserInputPtr stream;
 | |
| 
 | |
|     if (ioread == NULL)
 | |
|         return (NULL);
 | |
|     xmlInitParser();
 | |
| 
 | |
|     input = xmlParserInputBufferCreateIO(ioread, ioclose, ioctx,
 | |
|                                          XML_CHAR_ENCODING_NONE);
 | |
|     if (input == NULL) {
 | |
|         if (ioclose != NULL)
 | |
|             ioclose(ioctx);
 | |
|         return (NULL);
 | |
|     }
 | |
|     ctxt = xmlNewParserCtxt();
 | |
|     if (ctxt == NULL) {
 | |
|         xmlFreeParserInputBuffer(input);
 | |
|         return (NULL);
 | |
|     }
 | |
|     stream = xmlNewIOInputStream(ctxt, input, XML_CHAR_ENCODING_NONE);
 | |
|     if (stream == NULL) {
 | |
|         xmlFreeParserInputBuffer(input);
 | |
| 	xmlFreeParserCtxt(ctxt);
 | |
|         return (NULL);
 | |
|     }
 | |
|     inputPush(ctxt, stream);
 | |
|     return (xmlDoRead(ctxt, URL, encoding, options, 0));
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlCtxtReadDoc:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @str:  a pointer to a zero terminated string
 | |
|  * @URL:  the base URL to use for the document
 | |
|  * @encoding:  the document encoding, or NULL
 | |
|  * @options:  a combination of xmlParserOption
 | |
|  *
 | |
|  * parse an XML in-memory document and build a tree.
 | |
|  * This reuses the existing @ctxt parser context
 | |
|  *
 | |
|  * Returns the resulting document tree
 | |
|  */
 | |
| xmlDocPtr
 | |
| xmlCtxtReadDoc(xmlParserCtxtPtr ctxt, const xmlChar *str,
 | |
|                const char *URL, const char *encoding, int options)
 | |
| {
 | |
|     xmlParserInputBufferPtr input;
 | |
|     xmlParserInputPtr stream;
 | |
| 
 | |
|     if (ctxt == NULL)
 | |
|         return (NULL);
 | |
|     if (str == NULL)
 | |
|         return (NULL);
 | |
|     xmlInitParser();
 | |
| 
 | |
|     xmlCtxtReset(ctxt);
 | |
| 
 | |
|     input = xmlParserInputBufferCreateString(str);
 | |
|     if (input == NULL) {
 | |
| 	return(NULL);
 | |
|     }
 | |
| 
 | |
|     stream = xmlNewIOInputStream(ctxt, input, XML_CHAR_ENCODING_NONE);
 | |
|     if (stream == NULL) {
 | |
| 	xmlFreeParserInputBuffer(input);
 | |
| 	return(NULL);
 | |
|     }
 | |
| 
 | |
|     inputPush(ctxt, stream);
 | |
|     return (xmlDoRead(ctxt, URL, encoding, options, 1));
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlCtxtReadFile:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @filename:  a file or URL
 | |
|  * @encoding:  the document encoding, or NULL
 | |
|  * @options:  a combination of xmlParserOption
 | |
|  *
 | |
|  * parse an XML file from the filesystem or the network.
 | |
|  * This reuses the existing @ctxt parser context
 | |
|  *
 | |
|  * Returns the resulting document tree
 | |
|  */
 | |
| xmlDocPtr
 | |
| xmlCtxtReadFile(xmlParserCtxtPtr ctxt, const char *filename,
 | |
|                 const char *encoding, int options)
 | |
| {
 | |
|     xmlParserInputPtr stream;
 | |
| 
 | |
|     if (filename == NULL)
 | |
|         return (NULL);
 | |
|     if (ctxt == NULL)
 | |
|         return (NULL);
 | |
|     xmlInitParser();
 | |
| 
 | |
|     xmlCtxtReset(ctxt);
 | |
| 
 | |
|     stream = xmlLoadExternalEntity(filename, NULL, ctxt);
 | |
|     if (stream == NULL) {
 | |
|         return (NULL);
 | |
|     }
 | |
|     inputPush(ctxt, stream);
 | |
|     return (xmlDoRead(ctxt, NULL, encoding, options, 1));
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlCtxtReadMemory:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @buffer:  a pointer to a char array
 | |
|  * @size:  the size of the array
 | |
|  * @URL:  the base URL to use for the document
 | |
|  * @encoding:  the document encoding, or NULL
 | |
|  * @options:  a combination of xmlParserOption
 | |
|  *
 | |
|  * parse an XML in-memory document and build a tree.
 | |
|  * This reuses the existing @ctxt parser context
 | |
|  *
 | |
|  * Returns the resulting document tree
 | |
|  */
 | |
| xmlDocPtr
 | |
| xmlCtxtReadMemory(xmlParserCtxtPtr ctxt, const char *buffer, int size,
 | |
|                   const char *URL, const char *encoding, int options)
 | |
| {
 | |
|     xmlParserInputBufferPtr input;
 | |
|     xmlParserInputPtr stream;
 | |
| 
 | |
|     if (ctxt == NULL)
 | |
|         return (NULL);
 | |
|     if (buffer == NULL)
 | |
|         return (NULL);
 | |
|     xmlInitParser();
 | |
| 
 | |
|     xmlCtxtReset(ctxt);
 | |
| 
 | |
|     input = xmlParserInputBufferCreateMem(buffer, size, XML_CHAR_ENCODING_NONE);
 | |
|     if (input == NULL) {
 | |
| 	return(NULL);
 | |
|     }
 | |
| 
 | |
|     stream = xmlNewIOInputStream(ctxt, input, XML_CHAR_ENCODING_NONE);
 | |
|     if (stream == NULL) {
 | |
| 	xmlFreeParserInputBuffer(input);
 | |
| 	return(NULL);
 | |
|     }
 | |
| 
 | |
|     inputPush(ctxt, stream);
 | |
|     return (xmlDoRead(ctxt, URL, encoding, options, 1));
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlCtxtReadFd:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @fd:  an open file descriptor
 | |
|  * @URL:  the base URL to use for the document
 | |
|  * @encoding:  the document encoding, or NULL
 | |
|  * @options:  a combination of xmlParserOption
 | |
|  *
 | |
|  * parse an XML from a file descriptor and build a tree.
 | |
|  * This reuses the existing @ctxt parser context
 | |
|  * NOTE that the file descriptor will not be closed when the
 | |
|  *      reader is closed or reset.
 | |
|  *
 | |
|  * Returns the resulting document tree
 | |
|  */
 | |
| xmlDocPtr
 | |
| xmlCtxtReadFd(xmlParserCtxtPtr ctxt, int fd,
 | |
|               const char *URL, const char *encoding, int options)
 | |
| {
 | |
|     xmlParserInputBufferPtr input;
 | |
|     xmlParserInputPtr stream;
 | |
| 
 | |
|     if (fd < 0)
 | |
|         return (NULL);
 | |
|     if (ctxt == NULL)
 | |
|         return (NULL);
 | |
|     xmlInitParser();
 | |
| 
 | |
|     xmlCtxtReset(ctxt);
 | |
| 
 | |
| 
 | |
|     input = xmlParserInputBufferCreateFd(fd, XML_CHAR_ENCODING_NONE);
 | |
|     if (input == NULL)
 | |
|         return (NULL);
 | |
|     input->closecallback = NULL;
 | |
|     stream = xmlNewIOInputStream(ctxt, input, XML_CHAR_ENCODING_NONE);
 | |
|     if (stream == NULL) {
 | |
|         xmlFreeParserInputBuffer(input);
 | |
|         return (NULL);
 | |
|     }
 | |
|     inputPush(ctxt, stream);
 | |
|     return (xmlDoRead(ctxt, URL, encoding, options, 1));
 | |
| }
 | |
| 
 | |
| /**
 | |
|  * xmlCtxtReadIO:
 | |
|  * @ctxt:  an XML parser context
 | |
|  * @ioread:  an I/O read function
 | |
|  * @ioclose:  an I/O close function
 | |
|  * @ioctx:  an I/O handler
 | |
|  * @URL:  the base URL to use for the document
 | |
|  * @encoding:  the document encoding, or NULL
 | |
|  * @options:  a combination of xmlParserOption
 | |
|  *
 | |
|  * parse an XML document from I/O functions and source and build a tree.
 | |
|  * This reuses the existing @ctxt parser context
 | |
|  *
 | |
|  * Returns the resulting document tree
 | |
|  */
 | |
| xmlDocPtr
 | |
| xmlCtxtReadIO(xmlParserCtxtPtr ctxt, xmlInputReadCallback ioread,
 | |
|               xmlInputCloseCallback ioclose, void *ioctx,
 | |
| 	      const char *URL,
 | |
|               const char *encoding, int options)
 | |
| {
 | |
|     xmlParserInputBufferPtr input;
 | |
|     xmlParserInputPtr stream;
 | |
| 
 | |
|     if (ioread == NULL)
 | |
|         return (NULL);
 | |
|     if (ctxt == NULL)
 | |
|         return (NULL);
 | |
|     xmlInitParser();
 | |
| 
 | |
|     xmlCtxtReset(ctxt);
 | |
| 
 | |
|     input = xmlParserInputBufferCreateIO(ioread, ioclose, ioctx,
 | |
|                                          XML_CHAR_ENCODING_NONE);
 | |
|     if (input == NULL) {
 | |
|         if (ioclose != NULL)
 | |
|             ioclose(ioctx);
 | |
|         return (NULL);
 | |
|     }
 | |
|     stream = xmlNewIOInputStream(ctxt, input, XML_CHAR_ENCODING_NONE);
 | |
|     if (stream == NULL) {
 | |
|         xmlFreeParserInputBuffer(input);
 | |
|         return (NULL);
 | |
|     }
 | |
|     inputPush(ctxt, stream);
 | |
|     return (xmlDoRead(ctxt, URL, encoding, options, 1));
 | |
| }
 | |
| 
 |