third_party/libxml/src/parser.c - Issue 1193533007: Upgrade to libxml 2.9.2 and libxslt 1.1.28

Unified Diff: third_party/libxml/src/parser.c

Issue 1193533007: Upgrade to libxml 2.9.2 and libxslt 1.1.28 (Closed) Base URL: https://chromium.googlesource.com/chromium/src.git@master

Patch Set: no iconv Created 5 years, 6 months ago

Use n/p to move between diff chunks; N/P to move between comments. Draft comments are only viewable by you.

Jump to:

View side-by-side diff with in-line comments

Download patch

Index: third_party/libxml/src/parser.c

diff --git a/third_party/libxml/src/parser.c b/third_party/libxml/src/parser.c

index 6ee55378f3fc4c125d923422f142980787004a3e..1d9396786ba7eca5d8e985d18e2679398243acd4 100644

--- a/third_party/libxml/src/parser.c

+++ b/third_party/libxml/src/parser.c

@@ -17,7 +17,7 @@

* parserInternals.c to reduce this file size.

* As much as possible the functions are associated with their relative

* production in the XML specification. A few productions defining the

- * different ranges of character are actually implanted either in

+ * different ranges of character are actually implanted either in

* parserInternals.h or parserInternals.c

* The DOM tree build is realized from the default SAX callbacks in

* the module SAX.c.

@@ -40,6 +40,7 @@

#endif

#include <stdlib.h>

+#include <limits.h>

#include <string.h>

#include <stdarg.h>

#include <libxml/xmlmemory.h>

@@ -79,6 +80,12 @@

#ifdef HAVE_ZLIB_H

#include <zlib.h>

#endif

+#ifdef HAVE_LZMA_H

+#include <lzma.h>

+#endif

+#include "buf.h"

+#include "enc.h"

static void

xmlFatalErr(xmlParserCtxtPtr ctxt, xmlParserErrors error, const char *info);

@@ -114,16 +121,56 @@ xmlCreateEntityParserCtxtInternal(const xmlChar *URL, const xmlChar *ID,

* parser option.

static int

-xmlParserEntityCheck(xmlParserCtxtPtr ctxt, unsigned long size,

- xmlEntityPtr ent)

+xmlParserEntityCheck(xmlParserCtxtPtr ctxt, size_t size,

+ xmlEntityPtr ent, size_t replacement)

{

- unsigned long consumed = 0;

+ size_t consumed = 0;

if ((ctxt == NULL) || (ctxt->options & XML_PARSE_HUGE))

return (0);

if (ctxt->lastError.code == XML_ERR_ENTITY_LOOP)

return (1);

- if (size != 0) {

+ /*

+ * This may look absurd but is needed to detect

+ * entity problems

+ */

+ if ((ent != NULL) && (ent->etype != XML_INTERNAL_PREDEFINED_ENTITY) &&

+ (ent->content != NULL) && (ent->checked == 0)) {

+ unsigned long oldnbent = ctxt->nbentities;

+ xmlChar *rep;

+ ent->checked = 1;

+ rep = xmlStringDecodeEntities(ctxt, ent->content,

+ XML_SUBSTITUTE_REF, 0, 0, 0);

+ ent->checked = (ctxt->nbentities - oldnbent + 1) * 2;

+ if (rep != NULL) {

+ if (xmlStrchr(rep, '<'))

+ ent->checked |= 1;

+ xmlFree(rep);

+ rep = NULL;

+ }

+ if (replacement != 0) {

+ if (replacement < XML_MAX_TEXT_LENGTH)

+ return(0);

+ /*

+ * If the volume of entity copy reaches 10 times the

+ * amount of parsed data and over the large text threshold

+ * then that's very likely to be an abuse.

+ */

+ if (ctxt->input != NULL) {

+ consumed = ctxt->input->consumed +

+ (ctxt->input->cur - ctxt->input->base);

+ }

+ consumed += ctxt->sizeentities;

+ if (replacement < XML_PARSER_NON_LINEAR * consumed)

+ return(0);

+ } else if (size != 0) {

* Do the check based on the replacement size of the entity

@@ -146,7 +193,7 @@ xmlParserEntityCheck(xmlParserCtxtPtr ctxt, unsigned long size,

* use the number of parsed entities in the replacement

- size = ent->checked;

+ size = ent->checked / 2;

* The amount of data parsed counting entities size only once

@@ -165,11 +212,13 @@ xmlParserEntityCheck(xmlParserCtxtPtr ctxt, unsigned long size,

return (0);

} else {

- * strange we got no data for checking just return

+ * strange we got no data for checking

- return (0);

+ if (((ctxt->lastError.code != XML_ERR_UNDECLARED_ENTITY) &&

+ (ctxt->lastError.code != XML_WAR_UNDECLARED_ENTITY)) ||

+ (ctxt->nbentities <= 10000))

+ return (0);

}

xmlFatalErr(ctxt, XML_ERR_ENTITY_LOOP, NULL);

return (1);

}

@@ -191,12 +240,24 @@ unsigned int xmlParserMaxDepth = 256;

#define XML_PARSER_BUFFER_SIZE 100

#define SAX_COMPAT_MODE BAD_CAST "SAX compatibility mode document"

+/**

+ * XML_PARSER_CHUNK_SIZE

+ *

+ * When calling GROW, this is the minimal amount of data

+ * the parser expects to have received. It is not a hard

+ * limit but an optimization when reading strings like Names.

+ * It is not strictly needed as long as the input's available characters

+ * are followed by 0, which should be provided by the I/O level.

+ */

+#define XML_PARSER_CHUNK_SIZE 100

* List of XML prefixed PI allowed by W3C specs

static const char *xmlW3CPIs[] = {

"xml-stylesheet",

+ "xml-model",

NULL

};

@@ -229,7 +290,7 @@ xmlLoadEntityContent(xmlParserCtxtPtr ctxt, xmlEntityPtr entity);

/************************************************************************

* *

- * Some factorized error routines *

+ * Some factorized error routines *

* *

************************************************************************/

@@ -281,193 +342,201 @@ static void

xmlFatalErr(xmlParserCtxtPtr ctxt, xmlParserErrors error, const char *info)

{

const char *errmsg;

+ char errstr[129] = "";

if ((ctxt != NULL) && (ctxt->disableSAX != 0) &&

(ctxt->instate == XML_PARSER_EOF))

return;

switch (error) {

case XML_ERR_INVALID_HEX_CHARREF:

- errmsg = "CharRef: invalid hexadecimal value\n";

+ errmsg = "CharRef: invalid hexadecimal value";

break;

case XML_ERR_INVALID_DEC_CHARREF:

- errmsg = "CharRef: invalid decimal value\n";

+ errmsg = "CharRef: invalid decimal value";

break;

case XML_ERR_INVALID_CHARREF:

- errmsg = "CharRef: invalid value\n";

+ errmsg = "CharRef: invalid value";

break;

case XML_ERR_INTERNAL_ERROR:

errmsg = "internal error";

break;

case XML_ERR_PEREF_AT_EOF:

- errmsg = "PEReference at end of document\n";

+ errmsg = "PEReference at end of document";

break;

case XML_ERR_PEREF_IN_PROLOG:

- errmsg = "PEReference in prolog\n";

+ errmsg = "PEReference in prolog";

break;

case XML_ERR_PEREF_IN_EPILOG:

- errmsg = "PEReference in epilog\n";

+ errmsg = "PEReference in epilog";

break;

case XML_ERR_PEREF_NO_NAME:

- errmsg = "PEReference: no name\n";

+ errmsg = "PEReference: no name";

break;

case XML_ERR_PEREF_SEMICOL_MISSING:

- errmsg = "PEReference: expecting ';'\n";

+ errmsg = "PEReference: expecting ';'";

break;

case XML_ERR_ENTITY_LOOP:

- errmsg = "Detected an entity reference loop\n";

+ errmsg = "Detected an entity reference loop";

break;

case XML_ERR_ENTITY_NOT_STARTED:

- errmsg = "EntityValue: \" or ' expected\n";

+ errmsg = "EntityValue: \" or ' expected";

break;

case XML_ERR_ENTITY_PE_INTERNAL:

- errmsg = "PEReferences forbidden in internal subset\n";

+ errmsg = "PEReferences forbidden in internal subset";

break;

case XML_ERR_ENTITY_NOT_FINISHED:

- errmsg = "EntityValue: \" or ' expected\n";

+ errmsg = "EntityValue: \" or ' expected";

break;

case XML_ERR_ATTRIBUTE_NOT_STARTED:

- errmsg = "AttValue: \" or ' expected\n";

+ errmsg = "AttValue: \" or ' expected";

break;

case XML_ERR_LT_IN_ATTRIBUTE:

- errmsg = "Unescaped '<' not allowed in attributes values\n";

+ errmsg = "Unescaped '<' not allowed in attributes values";

break;

case XML_ERR_LITERAL_NOT_STARTED:

- errmsg = "SystemLiteral \" or ' expected\n";

+ errmsg = "SystemLiteral \" or ' expected";

break;

case XML_ERR_LITERAL_NOT_FINISHED:

- errmsg = "Unfinished System or Public ID \" or ' expected\n";

+ errmsg = "Unfinished System or Public ID \" or ' expected";

break;

case XML_ERR_MISPLACED_CDATA_END:

- errmsg = "Sequence ']]>' not allowed in content\n";

+ errmsg = "Sequence ']]>' not allowed in content";

break;

case XML_ERR_URI_REQUIRED:

- errmsg = "SYSTEM or PUBLIC, the URI is missing\n";

+ errmsg = "SYSTEM or PUBLIC, the URI is missing";

break;

case XML_ERR_PUBID_REQUIRED:

- errmsg = "PUBLIC, the Public Identifier is missing\n";

+ errmsg = "PUBLIC, the Public Identifier is missing";

break;

case XML_ERR_HYPHEN_IN_COMMENT:

- errmsg = "Comment must not contain '--' (double-hyphen)\n";

+ errmsg = "Comment must not contain '--' (double-hyphen)";

break;

case XML_ERR_PI_NOT_STARTED:

- errmsg = "xmlParsePI : no target name\n";

+ errmsg = "xmlParsePI : no target name";

break;

case XML_ERR_RESERVED_XML_NAME:

- errmsg = "Invalid PI name\n";

+ errmsg = "Invalid PI name";

break;

case XML_ERR_NOTATION_NOT_STARTED:

- errmsg = "NOTATION: Name expected here\n";

+ errmsg = "NOTATION: Name expected here";

break;

case XML_ERR_NOTATION_NOT_FINISHED:

- errmsg = "'>' required to close NOTATION declaration\n";

+ errmsg = "'>' required to close NOTATION declaration";

break;

case XML_ERR_VALUE_REQUIRED:

- errmsg = "Entity value required\n";

+ errmsg = "Entity value required";

break;

case XML_ERR_URI_FRAGMENT:

errmsg = "Fragment not allowed";

break;

case XML_ERR_ATTLIST_NOT_STARTED:

- errmsg = "'(' required to start ATTLIST enumeration\n";

+ errmsg = "'(' required to start ATTLIST enumeration";

break;

case XML_ERR_NMTOKEN_REQUIRED:

- errmsg = "NmToken expected in ATTLIST enumeration\n";

+ errmsg = "NmToken expected in ATTLIST enumeration";

break;

case XML_ERR_ATTLIST_NOT_FINISHED:

- errmsg = "')' required to finish ATTLIST enumeration\n";

+ errmsg = "')' required to finish ATTLIST enumeration";

break;

case XML_ERR_MIXED_NOT_STARTED:

- errmsg = "MixedContentDecl : '|' or ')*' expected\n";

+ errmsg = "MixedContentDecl : '|' or ')*' expected";

break;

case XML_ERR_PCDATA_REQUIRED:

- errmsg = "MixedContentDecl : '#PCDATA' expected\n";

+ errmsg = "MixedContentDecl : '#PCDATA' expected";

break;

case XML_ERR_ELEMCONTENT_NOT_STARTED:

- errmsg = "ContentDecl : Name or '(' expected\n";

+ errmsg = "ContentDecl : Name or '(' expected";

break;

case XML_ERR_ELEMCONTENT_NOT_FINISHED:

- errmsg = "ContentDecl : ',' '|' or ')' expected\n";

+ errmsg = "ContentDecl : ',' '|' or ')' expected";

break;

case XML_ERR_PEREF_IN_INT_SUBSET:

errmsg =

- "PEReference: forbidden within markup decl in internal subset\n";

+ "PEReference: forbidden within markup decl in internal subset";

break;

case XML_ERR_GT_REQUIRED:

- errmsg = "expected '>'\n";

+ errmsg = "expected '>'";

break;

case XML_ERR_CONDSEC_INVALID:

- errmsg = "XML conditional section '[' expected\n";

+ errmsg = "XML conditional section '[' expected";

break;

case XML_ERR_EXT_SUBSET_NOT_FINISHED:

- errmsg = "Content error in the external subset\n";

+ errmsg = "Content error in the external subset";

break;

case XML_ERR_CONDSEC_INVALID_KEYWORD:

errmsg =

- "conditional section INCLUDE or IGNORE keyword expected\n";

+ "conditional section INCLUDE or IGNORE keyword expected";

break;

case XML_ERR_CONDSEC_NOT_FINISHED:

- errmsg = "XML conditional section not closed\n";

+ errmsg = "XML conditional section not closed";

break;

case XML_ERR_XMLDECL_NOT_STARTED:

- errmsg = "Text declaration '<?xml' required\n";

+ errmsg = "Text declaration '<?xml' required";

break;

case XML_ERR_XMLDECL_NOT_FINISHED:

- errmsg = "parsing XML declaration: '?>' expected\n";

+ errmsg = "parsing XML declaration: '?>' expected";

break;

case XML_ERR_EXT_ENTITY_STANDALONE:

- errmsg = "external parsed entities cannot be standalone\n";

+ errmsg = "external parsed entities cannot be standalone";

break;

case XML_ERR_ENTITYREF_SEMICOL_MISSING:

- errmsg = "EntityRef: expecting ';'\n";

+ errmsg = "EntityRef: expecting ';'";

break;

case XML_ERR_DOCTYPE_NOT_FINISHED:

- errmsg = "DOCTYPE improperly terminated\n";

+ errmsg = "DOCTYPE improperly terminated";

break;

case XML_ERR_LTSLASH_REQUIRED:

- errmsg = "EndTag: '</' not found\n";

+ errmsg = "EndTag: '</' not found";

break;

case XML_ERR_EQUAL_REQUIRED:

- errmsg = "expected '='\n";

+ errmsg = "expected '='";

break;

case XML_ERR_STRING_NOT_CLOSED:

- errmsg = "String not closed expecting \" or '\n";

+ errmsg = "String not closed expecting \" or '";

break;

case XML_ERR_STRING_NOT_STARTED:

- errmsg = "String not started expecting ' or \"\n";

+ errmsg = "String not started expecting ' or \"";

break;

case XML_ERR_ENCODING_NAME:

- errmsg = "Invalid XML encoding name\n";

+ errmsg = "Invalid XML encoding name";

break;

case XML_ERR_STANDALONE_VALUE:

- errmsg = "standalone accepts only 'yes' or 'no'\n";

+ errmsg = "standalone accepts only 'yes' or 'no'";

break;

case XML_ERR_DOCUMENT_EMPTY:

- errmsg = "Document is empty\n";

+ errmsg = "Document is empty";

break;

case XML_ERR_DOCUMENT_END:

- errmsg = "Extra content at the end of the document\n";

+ errmsg = "Extra content at the end of the document";

break;

case XML_ERR_NOT_WELL_BALANCED:

- errmsg = "chunk is not well balanced\n";

+ errmsg = "chunk is not well balanced";

break;

case XML_ERR_EXTRA_CONTENT:

- errmsg = "extra content at the end of well balanced chunk\n";

+ errmsg = "extra content at the end of well balanced chunk";

break;

case XML_ERR_VERSION_MISSING:

- errmsg = "Malformed declaration expecting version\n";

+ errmsg = "Malformed declaration expecting version";

+ break;

+ case XML_ERR_NAME_TOO_LONG:

+ errmsg = "Name too long use XML_PARSE_HUGE option";

break;

#if 0

case:

- errmsg = "\n";

+ errmsg = "";

break;

#endif

default:

- errmsg = "Unregistered error message\n";

+ errmsg = "Unregistered error message";

}

+ if (info == NULL)

+ snprintf(errstr, 128, "%s\n", errmsg);

+ else

+ snprintf(errstr, 128, "%s: %%s\n", errmsg);

if (ctxt != NULL)

ctxt->errNo = error;

__xmlRaiseError(NULL, NULL, NULL, ctxt, NULL, XML_FROM_PARSER, error,

- XML_ERR_FATAL, NULL, 0, info, NULL, NULL, 0, 0, errmsg,

+ XML_ERR_FATAL, NULL, 0, info, NULL, NULL, 0, 0, &errstr[0],

info);

if (ctxt != NULL) {

ctxt->wellFormed = 0;

@@ -622,7 +691,7 @@ xmlFatalErrMsgInt(xmlParserCtxtPtr ctxt, xmlParserErrors error,

static void

xmlFatalErrMsgStrIntStr(xmlParserCtxtPtr ctxt, xmlParserErrors error,

- const char *msg, const xmlChar *str1, int val,

+ const char *msg, const xmlChar *str1, int val,

const xmlChar *str2)

{

if ((ctxt != NULL) && (ctxt->disableSAX != 0) &&

@@ -731,7 +800,7 @@ xmlNsErr(xmlParserCtxtPtr ctxt, xmlParserErrors error,

* @info1: extra information string

* @info2: extra information string

- * Handle a fatal parser error, i.e. violating Well-Formedness constraints

+ * Handle a namespace warning

static void

xmlNsWarn(xmlParserCtxtPtr ctxt, xmlParserErrors error,

@@ -750,7 +819,7 @@ xmlNsWarn(xmlParserCtxtPtr ctxt, xmlParserErrors error,

/************************************************************************

* *

- * Library wide options *

+ * Library wide options *

* *

************************************************************************/

@@ -954,6 +1023,12 @@ xmlHasFeature(xmlFeature feature)

#else

return(0);

#endif

+ case XML_WITH_LZMA:

+#ifdef LIBXML_LZMA_ENABLED

+ return(1);

+#else

+ return(0);

+#endif

case XML_WITH_ICU:

#ifdef LIBXML_ICU_ENABLED

return(1);

@@ -968,7 +1043,7 @@ xmlHasFeature(xmlFeature feature)

/************************************************************************

* *

- * SAX2 defaulted attributes handling *

+ * SAX2 defaulted attributes handling *

* *

************************************************************************/

@@ -992,8 +1067,8 @@ xmlDetectSAX2(xmlParserCtxtPtr ctxt) {

ctxt->str_xml = xmlDictLookup(ctxt->dict, BAD_CAST "xml", 3);

ctxt->str_xmlns = xmlDictLookup(ctxt->dict, BAD_CAST "xmlns", 5);

ctxt->str_xml_ns = xmlDictLookup(ctxt->dict, XML_XML_NAMESPACE, 36);

- if ((ctxt->str_xml==NULL) || (ctxt->str_xmlns==NULL) ||

- (ctxt->str_xml_ns == NULL)) {

+ if ((ctxt->str_xml==NULL) || (ctxt->str_xmlns==NULL) ||

+ (ctxt->str_xml_ns == NULL)) {

xmlErrMemory(ctxt, NULL);

}

@@ -1303,60 +1378,182 @@ xmlCleanSpecialAttr(xmlParserCtxtPtr ctxt)

* [37] UserCode ::= ('x' | 'X') '-' ([a-z] | [A-Z])+

* [38] Subcode ::= ([a-z] | [A-Z])+

+ * The current REC references the successors of RFC 1766, currently RFC 5646

+ *

+ * http://www.rfc-editor.org/rfc/rfc5646.txt

+ * langtag = language

+ * ["-" script]

+ * ["-" region]

+ * *("-" variant)

+ * *("-" extension)

+ * ["-" privateuse]

+ * language = 2*3ALPHA ; shortest ISO 639 code

+ * ["-" extlang] ; sometimes followed by

+ * ; extended language subtags

+ * / 4ALPHA ; or reserved for future use

+ * / 5*8ALPHA ; or registered language subtag

+ *

+ * extlang = 3ALPHA ; selected ISO 639 codes

+ * *2("-" 3ALPHA) ; permanently reserved

+ *

+ * script = 4ALPHA ; ISO 15924 code

+ *

+ * region = 2ALPHA ; ISO 3166-1 code

+ * / 3DIGIT ; UN M.49 code

+ *

+ * variant = 5*8alphanum ; registered variants

+ * / (DIGIT 3alphanum)

+ *

+ * extension = singleton 1*("-" (2*8alphanum))

+ *

+ * ; Single alphanumerics

+ * ; "x" reserved for private use

+ * singleton = DIGIT ; 0 - 9

+ * / %x41-57 ; A - W

+ * / %x59-5A ; Y - Z

+ * / %x61-77 ; a - w

+ * / %x79-7A ; y - z

+ *

+ * It sounds right to still allow irregular i-xxx IANA and user codes too.

+ * The parser below doesn't try to cope with extension or privateuse

+ * subtags; that could be added, but they are not interoperable anyway.

+ *

* Returns 1 if correct 0 otherwise

**/

int

xmlCheckLanguageID(const xmlChar * lang)

{

- const xmlChar *cur = lang;

+ const xmlChar *cur = lang, *nxt;

if (cur == NULL)

return (0);

if (((cur[0] == 'i') && (cur[1] == '-')) ||

- ((cur[0] == 'I') && (cur[1] == '-'))) {

+ ((cur[0] == 'I') && (cur[1] == '-')) ||

+ ((cur[0] == 'x') && (cur[1] == '-')) ||

+ ((cur[0] == 'X') && (cur[1] == '-'))) {

- * IANA code

+ * Still allow IANA codes and user codes, which come

+ * from the previous version of the XML-1.0 specification;

+ * they are deprecated but we should not fail.

cur += 2;

- while (((cur[0] >= 'A') && (cur[0] <= 'Z')) || /* non input consuming */

+ while (((cur[0] >= 'A') && (cur[0] <= 'Z')) ||

((cur[0] >= 'a') && (cur[0] <= 'z')))

cur++;

- } else if (((cur[0] == 'x') && (cur[1] == '-')) ||

- ((cur[0] == 'X') && (cur[1] == '-'))) {

- /*

- * User code

- */

- cur += 2;

- while (((cur[0] >= 'A') && (cur[0] <= 'Z')) || /* non input consuming */

- ((cur[0] >= 'a') && (cur[0] <= 'z')))

- cur++;

- } else if (((cur[0] >= 'A') && (cur[0] <= 'Z')) ||

- ((cur[0] >= 'a') && (cur[0] <= 'z'))) {

+ return(cur[0] == 0);

+ }

+ nxt = cur;

+ while (((nxt[0] >= 'A') && (nxt[0] <= 'Z')) ||

+ ((nxt[0] >= 'a') && (nxt[0] <= 'z')))

+ nxt++;

+ if (nxt - cur >= 4) {

- * ISO639

+ * Reserved

- cur++;

- if (((cur[0] >= 'A') && (cur[0] <= 'Z')) ||

- ((cur[0] >= 'a') && (cur[0] <= 'z')))

- cur++;

- else

- return (0);

- } else

- return (0);

- while (cur[0] != 0) { /* non input consuming */

- if (cur[0] != '-')

- return (0);

- cur++;

- if (((cur[0] >= 'A') && (cur[0] <= 'Z')) ||

- ((cur[0] >= 'a') && (cur[0] <= 'z')))

- cur++;

- else

- return (0);

- while (((cur[0] >= 'A') && (cur[0] <= 'Z')) || /* non input consuming */

- ((cur[0] >= 'a') && (cur[0] <= 'z')))

- cur++;

+ if ((nxt - cur > 8) || (nxt[0] != 0))

+ return(0);

+ return(1);

}

+ if (nxt - cur < 2)

+ return(0);

+ /* we got an ISO 639 code */

+ if (nxt[0] == 0)

+ return(1);

+ if (nxt[0] != '-')

+ return(0);

+ nxt++;

+ cur = nxt;

+ /* now we can have extlang or script or region or variant */

+ if ((nxt[0] >= '0') && (nxt[0] <= '9'))

+ goto region_m49;

+ while (((nxt[0] >= 'A') && (nxt[0] <= 'Z')) ||

+ ((nxt[0] >= 'a') && (nxt[0] <= 'z')))

+ nxt++;

+ if (nxt - cur == 4)

+ goto script;

+ if (nxt - cur == 2)

+ goto region;

+ if ((nxt - cur >= 5) && (nxt - cur <= 8))

+ goto variant;

+ if (nxt - cur != 3)

+ return(0);

+ /* we parsed an extlang */

+ if (nxt[0] == 0)

+ return(1);

+ if (nxt[0] != '-')

+ return(0);

+ nxt++;

+ cur = nxt;

+ /* now we can have script or region or variant */

+ if ((nxt[0] >= '0') && (nxt[0] <= '9'))

+ goto region_m49;

+ while (((nxt[0] >= 'A') && (nxt[0] <= 'Z')) ||

+ ((nxt[0] >= 'a') && (nxt[0] <= 'z')))

+ nxt++;

+ if (nxt - cur == 2)

+ goto region;

+ if ((nxt - cur >= 5) && (nxt - cur <= 8))

+ goto variant;

+ if (nxt - cur != 4)

+ return(0);

+ /* we parsed a script */

+script:

+ if (nxt[0] == 0)

+ return(1);

+ if (nxt[0] != '-')

+ return(0);

+ nxt++;

+ cur = nxt;

+ /* now we can have region or variant */

+ if ((nxt[0] >= '0') && (nxt[0] <= '9'))

+ goto region_m49;

+ while (((nxt[0] >= 'A') && (nxt[0] <= 'Z')) ||

+ ((nxt[0] >= 'a') && (nxt[0] <= 'z')))

+ nxt++;

+ if ((nxt - cur >= 5) && (nxt - cur <= 8))

+ goto variant;

+ if (nxt - cur != 2)

+ return(0);

+ /* we parsed a region */

+region:

+ if (nxt[0] == 0)

+ return(1);

+ if (nxt[0] != '-')

+ return(0);

+ nxt++;

+ cur = nxt;

+ /* now we can just have a variant */

+ while (((nxt[0] >= 'A') && (nxt[0] <= 'Z')) ||

+ ((nxt[0] >= 'a') && (nxt[0] <= 'z')))

+ nxt++;

+ if ((nxt - cur < 5) || (nxt - cur > 8))

+ return(0);

+ /* we parsed a variant */

+variant:

+ if (nxt[0] == 0)

+ return(1);

+ if (nxt[0] != '-')

+ return(0);

+ /* extensions and private use subtags not checked */

return (1);

+region_m49:

+ if (((nxt[1] >= '0') && (nxt[1] <= '9')) &&

+ ((nxt[2] >= '0') && (nxt[2] <= '9'))) {

+ nxt += 3;

+ goto region;

+ }

+ return(0);

}

/************************************************************************

@@ -1385,7 +1582,7 @@ nsPush(xmlParserCtxtPtr ctxt, const xmlChar *prefix, const xmlChar *URL)

{

if (ctxt->options & XML_PARSE_NSCLEAN) {

int i;

- for (i = 0;i < ctxt->nsNr;i += 2) {

+ for (i = ctxt->nsNr - 2;i >= 0;i -= 2) {

if (ctxt->nsTab[i] == prefix) {

/* in scope */

if (ctxt->nsTab[i + 1] == URL)

@@ -1697,15 +1894,14 @@ namePush(xmlParserCtxtPtr ctxt, const xmlChar * value)

if (ctxt->nameNr >= ctxt->nameMax) {

const xmlChar * *tmp;

- ctxt->nameMax *= 2;

tmp = (const xmlChar * *) xmlRealloc((xmlChar * *)ctxt->nameTab,

- ctxt->nameMax *

+ ctxt->nameMax * 2 *

sizeof(ctxt->nameTab[0]));

if (tmp == NULL) {

- ctxt->nameMax /= 2;

goto mem_error;

}

ctxt->nameTab = tmp;

+ ctxt->nameMax *= 2;

}

ctxt->nameTab[ctxt->nameNr] = value;

ctxt->name = value;

@@ -1791,7 +1987,7 @@ static int spacePop(xmlParserCtxtPtr ctxt) {

* to compare on ASCII based substring.

* SKIP(n) Skip n xmlChar, and must also be used only to skip ASCII defined

* strings without newlines within the parser.

- * NEXT1(l) Skip 1 xmlChar, and must also be used only to skip 1 non-newline ASCII

+ * NEXT1(l) Skip 1 xmlChar, and must also be used only to skip 1 non-newline ASCII

* defined char within the parser.

* Clean macros, not dependent of an ASCII context, expect UTF-8 encoding

@@ -1840,10 +2036,10 @@ static int spacePop(xmlParserCtxtPtr ctxt) {

#define SKIPL(val) do { \

int skipl; \

for(skipl=0; skipl<val; skipl++) { \

- if (*(ctxt->input->cur) == '\n') { \

+ if (*(ctxt->input->cur) == '\n') { \

ctxt->input->line++; ctxt->input->col = 1; \

- } else ctxt->input->col++; \

- ctxt->nbChars++; \

+ } else ctxt->input->col++; \

+ ctxt->nbChars++; \

ctxt->input->cur++; \

} \

if (*ctxt->input->cur == '%') xmlParserHandlePEReference(ctxt); \

@@ -1869,6 +2065,16 @@ static void xmlSHRINK (xmlParserCtxtPtr ctxt) {

xmlGROW (ctxt);

static void xmlGROW (xmlParserCtxtPtr ctxt) {

+ unsigned long curEnd = ctxt->input->end - ctxt->input->cur;

+ unsigned long curBase = ctxt->input->cur - ctxt->input->base;

+ if (((curEnd > (unsigned long) XML_MAX_LOOKUP_LIMIT) ||

+ (curBase > (unsigned long) XML_MAX_LOOKUP_LIMIT)) &&

+ ((ctxt->input->buf) && (ctxt->input->buf->readcallback != (xmlInputReadCallback) xmlNop)) &&

+ ((ctxt->options & XML_PARSE_HUGE) == 0)) {

+ xmlFatalErr(ctxt, XML_ERR_INTERNAL_ERROR, "Huge input lookup");

+ ctxt->instate = XML_PARSER_EOF;

+ }

xmlParserInputGrow(ctxt->input, INPUT_CHUNK);

if ((ctxt->input->cur != NULL) && (*ctxt->input->cur == 0) &&

(xmlParserInputGrow(ctxt->input, INPUT_CHUNK) <= 0))

@@ -1929,6 +2135,8 @@ xmlSkipBlankChars(xmlParserCtxtPtr ctxt) {

while (IS_BLANK_CH(*cur)) {

if (*cur == '\n') {

ctxt->input->line++; ctxt->input->col = 1;

+ } else {

+ ctxt->input->col++;

}

cur++;

res++;

@@ -2030,7 +2238,7 @@ xmlPushInput(xmlParserCtxtPtr ctxt, xmlParserInputPtr input) {

* [ WFC: Legal Character ]

* Characters referred to using character references must match the

- * production for Char.

+ * production for Char.

* Returns the value parsed (as an int), 0 in case of error

@@ -2054,7 +2262,7 @@ xmlParseCharRef(xmlParserCtxtPtr ctxt) {

if (ctxt->instate == XML_PARSER_EOF)

return(0);

}

- if ((RAW >= '0') && (RAW <= '9'))

+ if ((RAW >= '0') && (RAW <= '9'))

val = val * 16 + (CUR - '0');

else if ((RAW >= 'a') && (RAW <= 'f') && (count < 20))

val = val * 16 + (CUR - 'a') + 10;

@@ -2087,7 +2295,7 @@ xmlParseCharRef(xmlParserCtxtPtr ctxt) {

if (ctxt->instate == XML_PARSER_EOF)

return(0);

}

- if ((RAW >= '0') && (RAW <= '9'))

+ if ((RAW >= '0') && (RAW <= '9'))

val = val * 10 + (CUR - '0');

else {

xmlFatalErr(ctxt, XML_ERR_INVALID_DEC_CHARREF, NULL);

@@ -2113,7 +2321,7 @@ xmlParseCharRef(xmlParserCtxtPtr ctxt) {

* [ WFC: Legal Character ]

* Characters referred to using character references must match the

- * production for Char.

+ * production for Char.

if ((IS_CHAR(val) && (outofrange == 0))) {

return(val);

@@ -2138,7 +2346,7 @@ xmlParseCharRef(xmlParserCtxtPtr ctxt) {

* [ WFC: Legal Character ]

* Characters referred to using character references must match the

- * production for Char.

+ * production for Char.

* Returns the value parsed (as an int), 0 in case of error, str will be

* updated to the current value of the index

@@ -2157,7 +2365,7 @@ xmlParseStringCharRef(xmlParserCtxtPtr ctxt, const xmlChar **str) {

ptr += 3;

cur = *ptr;

while (cur != ';') { /* Non input consuming loop */

- if ((cur >= '0') && (cur <= '9'))

+ if ((cur >= '0') && (cur <= '9'))

val = val * 16 + (cur - '0');

else if ((cur >= 'a') && (cur <= 'f'))

val = val * 16 + (cur - 'a') + 10;

@@ -2180,7 +2388,7 @@ xmlParseStringCharRef(xmlParserCtxtPtr ctxt, const xmlChar **str) {

ptr += 2;

cur = *ptr;

while (cur != ';') { /* Non input consuming loops */

- if ((cur >= '0') && (cur <= '9'))

+ if ((cur >= '0') && (cur <= '9'))

val = val * 10 + (cur - '0');

else {

xmlFatalErr(ctxt, XML_ERR_INVALID_DEC_CHARREF, NULL);

@@ -2204,7 +2412,7 @@ xmlParseStringCharRef(xmlParserCtxtPtr ctxt, const xmlChar **str) {

* [ WFC: Legal Character ]

* Characters referred to using character references must match the

- * production for Char.

+ * production for Char.

if ((IS_CHAR(val) && (outofrange == 0))) {

return(val);

@@ -2226,9 +2434,9 @@ xmlParseStringCharRef(xmlParserCtxtPtr ctxt, const xmlChar **str) {

* Returns the new input stream or NULL

static void deallocblankswrapper (xmlChar *str) {xmlFree(str);}

static xmlParserInputPtr

xmlNewBlanksWrapperInputStream(xmlParserCtxtPtr ctxt, xmlEntityPtr entity) {

xmlParserInputPtr input;

@@ -2251,7 +2459,7 @@ xmlNewBlanksWrapperInputStream(xmlParserCtxtPtr ctxt, xmlEntityPtr entity) {

if (buffer == NULL) {

xmlErrMemory(ctxt, NULL);

xmlFree(input);

- return(NULL);

+ return(NULL);

}

buffer [0] = ' ';

buffer [1] = '%';

@@ -2270,12 +2478,12 @@ xmlNewBlanksWrapperInputStream(xmlParserCtxtPtr ctxt, xmlEntityPtr entity) {

/**

* xmlParserHandlePEReference:

* @ctxt: the parser context

- *

+ *

* [69] PEReference ::= '%' Name ';'

* [ WFC: No Recursion ]

* A parsed entity must not contain a recursive

- * reference to itself, either directly or indirectly.

+ * reference to itself, either directly or indirectly.

* [ WFC: Entity Declared ]

* In a document without any DTD, a document with only an internal DTD

@@ -2293,9 +2501,9 @@ xmlNewBlanksWrapperInputStream(xmlParserCtxtPtr ctxt, xmlEntityPtr entity) {

* NOTE: misleading but this is handled.

* A PEReference may have been detected in the current input stream

- * the handling is done accordingly to

+ * the handling is done accordingly to

* http://www.w3.org/TR/REC-xml#entproc

- * i.e.

+ * i.e.

* - Included in literal in entity values

* - Included as Parameter Entity reference within DTDs

@@ -2375,7 +2583,7 @@ xmlParserHandlePEReference(xmlParserCtxtPtr ctxt) {

if (ctxt->instate == XML_PARSER_EOF)

return;

if (entity == NULL) {

* [ WFC: Entity Declared ]

* In a document without any DTD, a document with only an

@@ -2401,12 +2609,13 @@ xmlParserHandlePEReference(xmlParserCtxtPtr ctxt) {

xmlValidityError(ctxt, XML_WAR_UNDECLARED_ENTITY,

"PEReference: %%%s; not found\n",

name, NULL);

- } else

+ } else

xmlWarningMsg(ctxt, XML_WAR_UNDECLARED_ENTITY,

"PEReference: %%%s; not found\n",

name, NULL);

ctxt->valid = 0;

}

+ xmlParserEntityCheck(ctxt, 0, NULL, 0);

} else if (ctxt->input->free != deallocblankswrapper) {

input = xmlNewBlanksWrapperInputStream(ctxt, entity);

if (xmlPushInput(ctxt, input) < 0)

@@ -2418,6 +2627,23 @@ xmlParserHandlePEReference(xmlParserCtxtPtr ctxt) {

xmlCharEncoding enc;

+ * Note: external parameter entities will not be loaded; this

+ * is not required for a non-validating parser unless the

+ * validation or entity-substitution options were

+ * given. Not loading them is far more secure, as the parser will

+ * only process data coming from the document entity by

+ * default.

+ */

+ if ((entity->etype == XML_EXTERNAL_PARAMETER_ENTITY) &&

+ ((ctxt->options & XML_PARSE_NOENT) == 0) &&

+ ((ctxt->options & XML_PARSE_DTDVALID) == 0) &&

+ ((ctxt->options & XML_PARSE_DTDLOAD) == 0) &&

+ ((ctxt->options & XML_PARSE_DTDATTR) == 0) &&

+ (ctxt->replaceEntities == 0) &&

+ (ctxt->validate == 0))

+ return;

+ /*

* handle the extra spaces added before and after

* c.f. http://www.w3.org/TR/REC-xml#as-PE

* this is done independently.

@@ -2426,7 +2652,7 @@ xmlParserHandlePEReference(xmlParserCtxtPtr ctxt) {

if (xmlPushInput(ctxt, input) < 0)

return;

- /*

+ /*

* Get the 4 first bytes and decode the charset

* if enc != XML_CHAR_ENCODING_NONE

* plug some encoding conversion routines.

@@ -2468,15 +2694,17 @@ xmlParserHandlePEReference(xmlParserCtxtPtr ctxt) {

* Macro used to grow the current buffer.

+ * buffer##_size is expected to be a size_t

+ * mem_error: is expected to handle memory allocation failures

#define growBuffer(buffer, n) { \

xmlChar *tmp; \

- buffer##_size *= 2; \

- buffer##_size += n; \

- tmp = (xmlChar *) \

- xmlRealloc(buffer, buffer##_size * sizeof(xmlChar)); \

+ size_t new_size = buffer##_size * 2 + n; \

+ if (new_size < buffer##_size) goto mem_error; \

+ tmp = (xmlChar *) xmlRealloc(buffer, new_size); \

if (tmp == NULL) goto mem_error; \

buffer = tmp; \

+ buffer##_size = new_size; \

}

/**

@@ -2488,7 +2716,7 @@ xmlParserHandlePEReference(xmlParserCtxtPtr ctxt) {

* @end: an end marker xmlChar, 0 if none

* @end2: an end marker xmlChar, 0 if none

* @end3: an end marker xmlChar, 0 if none

- *

+ *

* Takes a entity string content and process to do the adequate substitutions.

* [67] Reference ::= EntityRef | CharRef

@@ -2502,14 +2730,14 @@ xmlChar *

xmlStringLenDecodeEntities(xmlParserCtxtPtr ctxt, const xmlChar *str, int len,

int what, xmlChar end, xmlChar end2, xmlChar end3) {

xmlChar *buffer = NULL;

- int buffer_size = 0;

+ size_t buffer_size = 0;

+ size_t nbchars = 0;

xmlChar *current = NULL;

xmlChar *rep = NULL;

const xmlChar *last;

xmlEntityPtr ent;

int c,l;

- int nbchars = 0;

if ((ctxt == NULL) || (str == NULL) || (len < 0))

return(NULL);

@@ -2526,7 +2754,7 @@ xmlStringLenDecodeEntities(xmlParserCtxtPtr ctxt, const xmlChar *str, int len,

* allocate a translation buffer.

buffer_size = XML_PARSER_BIG_BUFFER_SIZE;

- buffer = (xmlChar *) xmlMallocAtomic(buffer_size * sizeof(xmlChar));

+ buffer = (xmlChar *) xmlMallocAtomic(buffer_size);

if (buffer == NULL) goto mem_error;

@@ -2546,7 +2774,7 @@ xmlStringLenDecodeEntities(xmlParserCtxtPtr ctxt, const xmlChar *str, int len,

if (val != 0) {

COPY_BUF(0,buffer,nbchars,val);

}

- if (nbchars > buffer_size - XML_PARSER_BUFFER_SIZE) {

+ if (nbchars + XML_PARSER_BUFFER_SIZE > buffer_size) {

growBuffer(buffer, XML_PARSER_BUFFER_SIZE);

}

} else if ((c == '&') && (what & XML_SUBSTITUTE_REF)) {

@@ -2558,13 +2786,14 @@ xmlStringLenDecodeEntities(xmlParserCtxtPtr ctxt, const xmlChar *str, int len,

if ((ctxt->lastError.code == XML_ERR_ENTITY_LOOP) ||

(ctxt->lastError.code == XML_ERR_INTERNAL_ERROR))

goto int_error;

+ xmlParserEntityCheck(ctxt, 0, ent, 0);

if (ent != NULL)

- ctxt->nbentities += ent->checked;

+ ctxt->nbentities += ent->checked / 2;

if ((ent != NULL) &&

(ent->etype == XML_INTERNAL_PREDEFINED_ENTITY)) {

if (ent->content != NULL) {

COPY_BUF(0,buffer,nbchars,ent->content[0]);

- if (nbchars > buffer_size - XML_PARSER_BUFFER_SIZE) {

+ if (nbchars + XML_PARSER_BUFFER_SIZE > buffer_size) {

growBuffer(buffer, XML_PARSER_BUFFER_SIZE);

}

} else {

@@ -2581,9 +2810,8 @@ xmlStringLenDecodeEntities(xmlParserCtxtPtr ctxt, const xmlChar *str, int len,

current = rep;

while (*current != 0) { /* non input consuming loop */

buffer[nbchars++] = *current++;

- if (nbchars >

- buffer_size - XML_PARSER_BUFFER_SIZE) {

- if (xmlParserEntityCheck(ctxt, nbchars, ent))

+ if (nbchars + XML_PARSER_BUFFER_SIZE > buffer_size) {

+ if (xmlParserEntityCheck(ctxt, nbchars, ent, 0))

goto int_error;

growBuffer(buffer, XML_PARSER_BUFFER_SIZE);

}

@@ -2596,7 +2824,7 @@ xmlStringLenDecodeEntities(xmlParserCtxtPtr ctxt, const xmlChar *str, int len,

const xmlChar *cur = ent->name;

buffer[nbchars++] = '&';

- if (nbchars > buffer_size - i - XML_PARSER_BUFFER_SIZE) {

+ if (nbchars + i + XML_PARSER_BUFFER_SIZE > buffer_size) {

growBuffer(buffer, i + XML_PARSER_BUFFER_SIZE);

}

for (;i > 0;i--)

@@ -2610,8 +2838,9 @@ xmlStringLenDecodeEntities(xmlParserCtxtPtr ctxt, const xmlChar *str, int len,

ent = xmlParseStringPEReference(ctxt, &str);

if (ctxt->lastError.code == XML_ERR_ENTITY_LOOP)

goto int_error;

+ xmlParserEntityCheck(ctxt, 0, ent, 0);

if (ent != NULL)

- ctxt->nbentities += ent->checked;

+ ctxt->nbentities += ent->checked / 2;

if (ent != NULL) {

if (ent->content == NULL) {

xmlLoadEntityContent(ctxt, ent);

@@ -2624,9 +2853,8 @@ xmlStringLenDecodeEntities(xmlParserCtxtPtr ctxt, const xmlChar *str, int len,

current = rep;

while (*current != 0) { /* non input consuming loop */

buffer[nbchars++] = *current++;

- if (nbchars >

- buffer_size - XML_PARSER_BUFFER_SIZE) {

- if (xmlParserEntityCheck(ctxt, nbchars, ent))

+ if (nbchars + XML_PARSER_BUFFER_SIZE > buffer_size) {

+ if (xmlParserEntityCheck(ctxt, nbchars, ent, 0))

goto int_error;

growBuffer(buffer, XML_PARSER_BUFFER_SIZE);

}

@@ -2638,8 +2866,8 @@ xmlStringLenDecodeEntities(xmlParserCtxtPtr ctxt, const xmlChar *str, int len,

} else {

COPY_BUF(l,buffer,nbchars,c);

str += l;

- if (nbchars > buffer_size - XML_PARSER_BUFFER_SIZE) {

- growBuffer(buffer, XML_PARSER_BUFFER_SIZE);

+ if (nbchars + XML_PARSER_BUFFER_SIZE > buffer_size) {

+ growBuffer(buffer, XML_PARSER_BUFFER_SIZE);

}

if (str < last)

@@ -2668,7 +2896,7 @@ int_error:

* @end: an end marker xmlChar, 0 if none

* @end2: an end marker xmlChar, 0 if none

* @end3: an end marker xmlChar, 0 if none

- *

+ *

* Takes a entity string content and process to do the adequate substitutions.

* [67] Reference ::= EntityRef | CharRef

@@ -3031,7 +3259,7 @@ xmlIsNameChar(xmlParserCtxtPtr ctxt, int c) {

} else {

if ((IS_LETTER(c)) || (IS_DIGIT(c)) ||

(c == '.') || (c == '-') ||

- (c == '_') || (c == ':') ||

+ (c == '_') || (c == ':') ||

(IS_COMBINING(c)) ||

(IS_EXTENDER(c)))

return(1);

@@ -3057,7 +3285,7 @@ xmlParseNameComplex(xmlParserCtxtPtr ctxt) {

GROW;

if (ctxt->instate == XML_PARSER_EOF)

- return(NULL);

+ return(NULL);

c = CUR_CHAR(l);

if ((ctxt->options & XML_PARSE_OLD10) == 0) {

@@ -3106,7 +3334,7 @@ xmlParseNameComplex(xmlParserCtxtPtr ctxt) {

((c >= 0xFDF0) && (c <= 0xFFFD)) ||

((c >= 0x10000) && (c <= 0xEFFFF))

)) {

- if (count++ > 100) {

+ if (count++ > XML_PARSER_CHUNK_SIZE) {

count = 0;

GROW;

if (ctxt->instate == XML_PARSER_EOF)

@@ -3129,10 +3357,10 @@ xmlParseNameComplex(xmlParserCtxtPtr ctxt) {

while ((c != ' ') && (c != '>') && (c != '/') && /* test bigname.xml */

((IS_LETTER(c)) || (IS_DIGIT(c)) ||

(c == '.') || (c == '-') ||

- (c == '_') || (c == ':') ||

+ (c == '_') || (c == ':') ||

(IS_COMBINING(c)) ||

(IS_EXTENDER(c)))) {

- if (count++ > 100) {

+ if (count++ > XML_PARSER_CHUNK_SIZE) {

count = 0;

GROW;

if (ctxt->instate == XML_PARSER_EOF)

@@ -3141,8 +3369,20 @@ xmlParseNameComplex(xmlParserCtxtPtr ctxt) {

len += l;

NEXTL(l);

c = CUR_CHAR(l);

+ if (c == 0) {

+ count = 0;

+ GROW;

+ if (ctxt->instate == XML_PARSER_EOF)

+ return(NULL);

+ c = CUR_CHAR(l);

+ }

}

+ if ((len > XML_MAX_NAME_LENGTH) &&

+ ((ctxt->options & XML_PARSE_HUGE) == 0)) {

+ xmlFatalErr(ctxt, XML_ERR_NAME_TOO_LONG, "Name");

+ return(NULL);

+ }

if ((*ctxt->input->cur == '\n') && (ctxt->input->cur[-1] == '\r'))

return(xmlDictLookup(ctxt->dict, ctxt->input->cur - (len + 1), len));

return(xmlDictLookup(ctxt->dict, ctxt->input->cur - len, len));

@@ -3192,6 +3432,11 @@ xmlParseName(xmlParserCtxtPtr ctxt) {

in++;

if ((*in > 0) && (*in < 0x80)) {

count = in - ctxt->input->cur;

+ if ((count > XML_MAX_NAME_LENGTH) &&

+ ((ctxt->options & XML_PARSE_HUGE) == 0)) {

+ xmlFatalErr(ctxt, XML_ERR_NAME_TOO_LONG, "Name");

+ return(NULL);

+ }

ret = xmlDictLookup(ctxt->dict, ctxt->input->cur, count);

ctxt->input->cur = in;

ctxt->nbChars += count;

@@ -3210,6 +3455,7 @@ xmlParseNCNameComplex(xmlParserCtxtPtr ctxt) {

int len = 0, l;

int c;

int count = 0;

+ const xmlChar *end; /* needed because CUR_CHAR() can move cur on \r\n */

#ifdef DEBUG

nbParseNCNameComplex++;

@@ -3219,6 +3465,7 @@ xmlParseNCNameComplex(xmlParserCtxtPtr ctxt) {

* Handler for more complex cases

GROW;

+ end = ctxt->input->cur;

c = CUR_CHAR(l);

if ((c == ' ') || (c == '>') || (c == '/') || /* accelerators */

(!xmlIsNameStartChar(ctxt, c) || (c == ':'))) {

@@ -3227,7 +3474,12 @@ xmlParseNCNameComplex(xmlParserCtxtPtr ctxt) {

while ((c != ' ') && (c != '>') && (c != '/') && /* test bigname.xml */

(xmlIsNameChar(ctxt, c) && (c != ':'))) {

- if (count++ > 100) {

+ if (count++ > XML_PARSER_CHUNK_SIZE) {

+ if ((len > XML_MAX_NAME_LENGTH) &&

+ ((ctxt->options & XML_PARSE_HUGE) == 0)) {

+ xmlFatalErr(ctxt, XML_ERR_NAME_TOO_LONG, "NCName");

+ return(NULL);

+ }

count = 0;

GROW;

if (ctxt->instate == XML_PARSER_EOF)

@@ -3235,15 +3487,29 @@ xmlParseNCNameComplex(xmlParserCtxtPtr ctxt) {

}

len += l;

NEXTL(l);

+ end = ctxt->input->cur;

c = CUR_CHAR(l);

+ if (c == 0) {

+ count = 0;

+ GROW;

+ if (ctxt->instate == XML_PARSER_EOF)

+ return(NULL);

+ end = ctxt->input->cur;

+ c = CUR_CHAR(l);

+ }

}

- return(xmlDictLookup(ctxt->dict, ctxt->input->cur - len, len));

+ if ((len > XML_MAX_NAME_LENGTH) &&

+ ((ctxt->options & XML_PARSE_HUGE) == 0)) {

+ xmlFatalErr(ctxt, XML_ERR_NAME_TOO_LONG, "NCName");

+ return(NULL);

+ }

+ return(xmlDictLookup(ctxt->dict, end - len, len));

}

/**

* xmlParseNCName:

* @ctxt: an XML parser context

- * @len: lenght of the string parsed

+ * @len: length of the string parsed

* parse an XML name.

@@ -3281,6 +3547,11 @@ xmlParseNCName(xmlParserCtxtPtr ctxt) {

in++;

if ((*in > 0) && (*in < 0x80)) {

count = in - ctxt->input->cur;

+ if ((count > XML_MAX_NAME_LENGTH) &&

+ ((ctxt->options & XML_PARSE_HUGE) == 0)) {

+ xmlFatalErr(ctxt, XML_ERR_NAME_TOO_LONG, "NCName");

+ return(NULL);

+ }

ret = xmlDictLookup(ctxt->dict, ctxt->input->cur, count);

ctxt->input->cur = in;

ctxt->nbChars += count;

@@ -3349,7 +3620,7 @@ xmlParseNameAndCompare(xmlParserCtxtPtr ctxt, xmlChar const *other) {

* [6] Names ::= Name (#x20 Name)*

- * Returns the Name parsed or NULL. The @str pointer

+ * Returns the Name parsed or NULL. The @str pointer

* is updated to the current location in the string.

@@ -3393,6 +3664,13 @@ xmlParseStringName(xmlParserCtxtPtr ctxt, const xmlChar** str) {

while (xmlIsNameChar(ctxt, c)) {

if (len + 10 > max) {

xmlChar *tmp;

+ if ((len > XML_MAX_NAME_LENGTH) &&

+ ((ctxt->options & XML_PARSE_HUGE) == 0)) {

+ xmlFatalErr(ctxt, XML_ERR_NAME_TOO_LONG, "NCName");

+ xmlFree(buffer);

+ return(NULL);

+ }

max *= 2;

tmp = (xmlChar *) xmlRealloc(buffer,

max * sizeof(xmlChar));

@@ -3412,6 +3690,11 @@ xmlParseStringName(xmlParserCtxtPtr ctxt, const xmlChar** str) {

return(buffer);

}

+ if ((len > XML_MAX_NAME_LENGTH) &&

+ ((ctxt->options & XML_PARSE_HUGE) == 0)) {

+ xmlFatalErr(ctxt, XML_ERR_NAME_TOO_LONG, "NCName");

+ return(NULL);

+ }

*str = cur;

return(xmlStrndup(buf, len));

}

@@ -3446,13 +3729,20 @@ xmlParseNmtoken(xmlParserCtxtPtr ctxt) {

c = CUR_CHAR(l);

while (xmlIsNameChar(ctxt, c)) {

- if (count++ > 100) {

+ if (count++ > XML_PARSER_CHUNK_SIZE) {

count = 0;

GROW;

}

COPY_BUF(l,buf,len,c);

NEXTL(l);

c = CUR_CHAR(l);

+ if (c == 0) {

+ count = 0;

+ GROW;

+ if (ctxt->instate == XML_PARSER_EOF)

+ return(NULL);

+ c = CUR_CHAR(l);

+ }

if (len >= XML_MAX_NAMELEN) {

* Okay someone managed to make a huge token, so he's ready to pay

@@ -3468,7 +3758,7 @@ xmlParseNmtoken(xmlParserCtxtPtr ctxt) {

}

memcpy(buffer, buf, len);

while (xmlIsNameChar(ctxt, c)) {

- if (count++ > 100) {

+ if (count++ > XML_PARSER_CHUNK_SIZE) {

count = 0;

GROW;

if (ctxt->instate == XML_PARSER_EOF) {

@@ -3479,6 +3769,12 @@ xmlParseNmtoken(xmlParserCtxtPtr ctxt) {

if (len + 10 > max) {

xmlChar *tmp;

+ if ((max > XML_MAX_NAME_LENGTH) &&

+ ((ctxt->options & XML_PARSE_HUGE) == 0)) {

+ xmlFatalErr(ctxt, XML_ERR_NAME_TOO_LONG, "NmToken");

+ xmlFree(buffer);

+ return(NULL);

+ }

max *= 2;

tmp = (xmlChar *) xmlRealloc(buffer,

max * sizeof(xmlChar));

@@ -3499,6 +3795,11 @@ xmlParseNmtoken(xmlParserCtxtPtr ctxt) {

}

if (len == 0)

return(NULL);

+ if ((len > XML_MAX_NAME_LENGTH) &&

+ ((ctxt->options & XML_PARSE_HUGE) == 0)) {

+ xmlFatalErr(ctxt, XML_ERR_NAME_TOO_LONG, "NmToken");

+ return(NULL);

+ }

return(xmlStrndup(buf, len));

}

@@ -3556,7 +3857,7 @@ xmlParseEntityValue(xmlParserCtxtPtr ctxt, xmlChar **orig) {

* When a parameter entity reference appears in a literal entity

* value, ... a single or double quote character in the replacement

* text is always treated as a normal data character and will not

- * terminate the literal.

+ * terminate the literal.

* In practice it means we stop the loop only when back at parsing

* the initial entity and the quote is found

@@ -3667,8 +3968,8 @@ xmlParseAttValueComplex(xmlParserCtxtPtr ctxt, int *attlen, int normalize) {

xmlChar limit = 0;

xmlChar *buf = NULL;

xmlChar *rep = NULL;

- int len = 0;

- int buf_size = 0;

+ size_t len = 0;

+ size_t buf_size = 0;

int c, l, in_space = 0;

xmlChar *current = NULL;

xmlEntityPtr ent;

@@ -3690,7 +3991,7 @@ xmlParseAttValueComplex(xmlParserCtxtPtr ctxt, int *attlen, int normalize) {

* allocate a translation buffer.

buf_size = XML_PARSER_BUFFER_SIZE;

- buf = (xmlChar *) xmlMallocAtomic(buf_size * sizeof(xmlChar));

+ buf = (xmlChar *) xmlMallocAtomic(buf_size);

if (buf == NULL) goto mem_error;

@@ -3700,6 +4001,16 @@ xmlParseAttValueComplex(xmlParserCtxtPtr ctxt, int *attlen, int normalize) {

while (((NXT(0) != limit) && /* checked */

(IS_CHAR(c)) && (c != '<')) &&

(ctxt->instate != XML_PARSER_EOF)) {

+ /*

+ * Impose a reasonable limit on attribute size, unless XML_PARSE_HUGE

+ * special option is given

+ */

+ if ((len > XML_MAX_TEXT_LENGTH) &&

+ ((ctxt->options & XML_PARSE_HUGE) == 0)) {

+ xmlFatalErrMsg(ctxt, XML_ERR_ATTRIBUTE_NOT_FINISHED,

+ "AttValue length too long\n");

+ goto mem_error;

+ }

if (c == 0) break;

if (c == '&') {

in_space = 0;

@@ -3708,7 +4019,7 @@ xmlParseAttValueComplex(xmlParserCtxtPtr ctxt, int *attlen, int normalize) {

if (val == '&') {

if (ctxt->replaceEntities) {

- if (len > buf_size - 10) {

+ if (len + 10 > buf_size) {

growBuffer(buf, 10);

}

buf[len++] = '&';

@@ -3717,7 +4028,7 @@ xmlParseAttValueComplex(xmlParserCtxtPtr ctxt, int *attlen, int normalize) {

* The reparsing will be done in xmlStringGetNodeList()

* called by the attribute() function in SAX.c

- if (len > buf_size - 10) {

+ if (len + 10 > buf_size) {

growBuffer(buf, 10);

}

buf[len++] = '&';

@@ -3727,7 +4038,7 @@ xmlParseAttValueComplex(xmlParserCtxtPtr ctxt, int *attlen, int normalize) {

buf[len++] = ';';

}

} else if (val != 0) {

- if (len > buf_size - 10) {

+ if (len + 10 > buf_size) {

growBuffer(buf, 10);

}

len += xmlCopyChar(0, &buf[len], val);

@@ -3739,7 +4050,7 @@ xmlParseAttValueComplex(xmlParserCtxtPtr ctxt, int *attlen, int normalize) {

ctxt->nbentities += ent->owner;

if ((ent != NULL) &&

(ent->etype == XML_INTERNAL_PREDEFINED_ENTITY)) {

- if (len > buf_size - 10) {

+ if (len + 10 > buf_size) {

growBuffer(buf, 10);

}

if ((ctxt->replaceEntities == 0) &&

@@ -3752,7 +4063,7 @@ xmlParseAttValueComplex(xmlParserCtxtPtr ctxt, int *attlen, int normalize) {

} else {

buf[len++] = ent->content[0];

}

- } else if ((ent != NULL) &&

+ } else if ((ent != NULL) &&

(ctxt->replaceEntities != 0)) {

if (ent->etype != XML_INTERNAL_PREDEFINED_ENTITY) {

rep = xmlStringDecodeEntities(ctxt, ent->content,

@@ -3767,7 +4078,7 @@ xmlParseAttValueComplex(xmlParserCtxtPtr ctxt, int *attlen, int normalize) {

current++;

} else

buf[len++] = *current++;

- if (len > buf_size - 10) {

+ if (len + 10 > buf_size) {

growBuffer(buf, 10);

}

@@ -3775,7 +4086,7 @@ xmlParseAttValueComplex(xmlParserCtxtPtr ctxt, int *attlen, int normalize) {

rep = NULL;

}

} else {

- if (len > buf_size - 10) {

+ if (len + 10 > buf_size) {

growBuffer(buf, 10);

}

if (ent->content != NULL)

@@ -3790,10 +4101,16 @@ xmlParseAttValueComplex(xmlParserCtxtPtr ctxt, int *attlen, int normalize) {

* entities problems

if ((ent->etype != XML_INTERNAL_PREDEFINED_ENTITY) &&

- (ent->content != NULL)) {

+ (ent->content != NULL) && (ent->checked == 0)) {

+ unsigned long oldnbent = ctxt->nbentities;

rep = xmlStringDecodeEntities(ctxt, ent->content,

XML_SUBSTITUTE_REF, 0, 0, 0);

+ ent->checked = (ctxt->nbentities - oldnbent + 1) * 2;

if (rep != NULL) {

+ if (xmlStrchr(rep, '<'))

+ ent->checked |= 1;

xmlFree(rep);

rep = NULL;

}

@@ -3803,7 +4120,7 @@ xmlParseAttValueComplex(xmlParserCtxtPtr ctxt, int *attlen, int normalize) {

* Just output the reference

buf[len++] = '&';

- while (len > buf_size - i - 10) {

+ while (len + i + 10 > buf_size) {

growBuffer(buf, i + 10);

}

for (;i > 0;i--)

@@ -3816,7 +4133,7 @@ xmlParseAttValueComplex(xmlParserCtxtPtr ctxt, int *attlen, int normalize) {

if ((len != 0) || (!normalize)) {

if ((!normalize) || (!in_space)) {

COPY_BUF(l,buf,len,0x20);

- while (len > buf_size - 10) {

+ while (len + 10 > buf_size) {

growBuffer(buf, 10);

}

@@ -3825,7 +4142,7 @@ xmlParseAttValueComplex(xmlParserCtxtPtr ctxt, int *attlen, int normalize) {

} else {

in_space = 0;

COPY_BUF(l,buf,len,c);

- if (len > buf_size - 10) {

+ if (len + 10 > buf_size) {

growBuffer(buf, 10);

}

@@ -3853,7 +4170,18 @@ xmlParseAttValueComplex(xmlParserCtxtPtr ctxt, int *attlen, int normalize) {

}

} else

NEXT;

- if (attlen != NULL) *attlen = len;

+ /*

+ * There we potentially risk an overflow, don't allow attribute value of

+ * length more than INT_MAX it is a very reasonable assumption !

+ */

+ if (len >= INT_MAX) {

+ xmlFatalErrMsg(ctxt, XML_ERR_ATTRIBUTE_NOT_FINISHED,

+ "AttValue length too long\n");

+ goto mem_error;

+ }

+ if (attlen != NULL) *attlen = (int) len;

return(buf);

mem_error:

@@ -3879,20 +4207,20 @@ error:

* 3.3.3 Attribute-Value Normalization:

* Before the value of an attribute is passed to the application or

- * checked for validity, the XML processor must normalize it as follows:

+ * checked for validity, the XML processor must normalize it as follows:

* - a character reference is processed by appending the referenced

* character to the attribute value

* - an entity reference is processed by recursively processing the

- * replacement text of the entity

+ * replacement text of the entity

* - a whitespace character (#x20, #xD, #xA, #x9) is processed by

* appending #x20 to the normalized value, except that only a single

* #x20 is appended for a "#xD#xA" sequence that is part of an external

- * parsed entity or the literal entity value of an internal parsed entity

- * - other characters are processed by appending them to the normalized value

+ * parsed entity or the literal entity value of an internal parsed entity

+ * - other characters are processed by appending them to the normalized value

* If the declared value is not CDATA, then the XML processor must further

* process the normalized attribute value by discarding any leading and

* trailing space (#x20) characters, and by replacing sequences of space

- * (#x20) characters by a single space (#x20) character.

+ * (#x20) characters by a single space (#x20) character.

* All attributes for which no declaration has been read should be treated

* by a non-validating parser as if declared CDATA.

@@ -3909,7 +4237,7 @@ xmlParseAttValue(xmlParserCtxtPtr ctxt) {

/**

* xmlParseSystemLiteral:

* @ctxt: an XML parser context

- *

+ *

* parse an XML Literal

* [11] SystemLiteral ::= ('"' [^"]* '"') | ("'" [^']* "'")

@@ -3938,7 +4266,7 @@ xmlParseSystemLiteral(xmlParserCtxtPtr ctxt) {

xmlFatalErr(ctxt, XML_ERR_LITERAL_NOT_STARTED, NULL);

return(NULL);

}

buf = (xmlChar *) xmlMallocAtomic(size * sizeof(xmlChar));

if (buf == NULL) {

xmlErrMemory(ctxt, NULL);

@@ -3950,6 +4278,13 @@ xmlParseSystemLiteral(xmlParserCtxtPtr ctxt) {

if (len + 5 >= size) {

xmlChar *tmp;

+ if ((size > XML_MAX_NAME_LENGTH) &&

+ ((ctxt->options & XML_PARSE_HUGE) == 0)) {

+ xmlFatalErr(ctxt, XML_ERR_NAME_TOO_LONG, "SystemLiteral");

+ xmlFree(buf);

+ ctxt->instate = (xmlParserInputState) state;

+ return(NULL);

+ }

size *= 2;

tmp = (xmlChar *) xmlRealloc(buf, size * sizeof(xmlChar));

if (tmp == NULL) {

@@ -4031,6 +4366,12 @@ xmlParsePubidLiteral(xmlParserCtxtPtr ctxt) {

if (len + 1 >= size) {

xmlChar *tmp;

+ if ((size > XML_MAX_NAME_LENGTH) &&

+ ((ctxt->options & XML_PARSE_HUGE) == 0)) {

+ xmlFatalErr(ctxt, XML_ERR_NAME_TOO_LONG, "Public ID");

+ xmlFree(buf);

+ return(NULL);

+ }

size *= 2;

tmp = (xmlChar *) xmlRealloc(buf, size * sizeof(xmlChar));

if (tmp == NULL) {

@@ -4119,7 +4460,7 @@ static const unsigned char test_char_data[256] = {

* The right angle bracket (>) may be represented using the string "&gt;",

* and must, for compatibility, be escaped using "&gt;" or a character

* reference when it appears in the string "]]>" in content, when that

- * string is not marking the end of a CDATA section.

+ * string is not marking the end of a CDATA section.

* [14] CharData ::= [^<&]* - ([^<&]* ']]>' [^<&]*)

@@ -4286,7 +4627,7 @@ xmlParseCharDataComplex(xmlParserCtxtPtr ctxt, int cdata) {

GROW;

cur = CUR_CHAR(l);

while ((cur != '<') && /* checked */

- (cur != '&') &&

+ (cur != '&') &&

(IS_CHAR(cur))) /* test also done in xmlCurrentChar() */ {

if ((cur == ']') && (NXT(1) == ']') &&

(NXT(2) == '>')) {

@@ -4419,7 +4760,7 @@ xmlParseExternalID(xmlParserCtxtPtr ctxt, xmlChar **publicID, int strict) {

}

} else {

- * We handle [83] so we return immediately, if

+ * We handle [83] so we return immediately, if

* "S SystemLiteral" is not detected. From a purely parsing

* point of view that's a nice mess.

@@ -4428,7 +4769,7 @@ xmlParseExternalID(xmlParserCtxtPtr ctxt, xmlChar **publicID, int strict) {

ptr = CUR_PTR;

if (!IS_BLANK_CH(*ptr)) return(NULL);

while (IS_BLANK_CH(*ptr)) ptr++; /* TODO: dangerous, fix ! */

if ((*ptr != '\'') && (*ptr != '"')) return(NULL);

}

@@ -4456,11 +4797,12 @@ xmlParseExternalID(xmlParserCtxtPtr ctxt, xmlChar **publicID, int strict) {

* [15] Comment ::= '<!--' ((Char - '-') | ('-' (Char - '-')))* '-->'

static void

-xmlParseCommentComplex(xmlParserCtxtPtr ctxt, xmlChar *buf, int len, int size) {

+xmlParseCommentComplex(xmlParserCtxtPtr ctxt, xmlChar *buf,

+ size_t len, size_t size) {

int q, ql;

int r, rl;

int cur, l;

- int count = 0;

+ size_t count = 0;

int inputid;

inputid = ctxt->input->id;

@@ -4506,16 +4848,26 @@ xmlParseCommentComplex(xmlParserCtxtPtr ctxt, xmlChar *buf, int len, int size) {

if ((r == '-') && (q == '-')) {

xmlFatalErr(ctxt, XML_ERR_HYPHEN_IN_COMMENT, NULL);

}

+ if ((len > XML_MAX_TEXT_LENGTH) &&

+ ((ctxt->options & XML_PARSE_HUGE) == 0)) {

+ xmlFatalErrMsgStr(ctxt, XML_ERR_COMMENT_NOT_FINISHED,

+ "Comment too big found", NULL);

+ xmlFree (buf);

+ return;

+ }

if (len + 5 >= size) {

xmlChar *new_buf;

- size *= 2;

- new_buf = (xmlChar *) xmlRealloc(buf, size * sizeof(xmlChar));

+ size_t new_size;

+ new_size = size * 2;

+ new_buf = (xmlChar *) xmlRealloc(buf, new_size);

if (new_buf == NULL) {

xmlFree (buf);

xmlErrMemory(ctxt, NULL);

return;

}

buf = new_buf;

+ size = new_size;

}

COPY_BUF(ql,buf,len,q);

q = r;

@@ -4580,11 +4932,12 @@ not_terminated:

void

xmlParseComment(xmlParserCtxtPtr ctxt) {

xmlChar *buf = NULL;

- int size = XML_PARSER_BUFFER_SIZE;

- int len = 0;

+ size_t size = XML_PARSER_BUFFER_SIZE;

+ size_t len = 0;

xmlParserInputState state;

const xmlChar *in;

- int nbchar = 0, ccol;

+ size_t nbchar = 0;

+ int ccol;

int inputid;

@@ -4664,6 +5017,13 @@ get_more:

buf[len] = 0;

}

+ if ((len > XML_MAX_TEXT_LENGTH) &&

+ ((ctxt->options & XML_PARSE_HUGE) == 0)) {

+ xmlFatalErrMsgStr(ctxt, XML_ERR_COMMENT_NOT_FINISHED,

+ "Comment too big found", NULL);

+ xmlFree (buf);

+ return;

+ }

ctxt->input->cur = in;

if (*in == 0xA) {

in++;

@@ -4684,7 +5044,7 @@ get_more:

if (ctxt->instate == XML_PARSER_EOF) {

xmlFree(buf);

return;

- }

+ }

in = ctxt->input->cur;

if (*in == '-') {

if (in[1] == '-') {

@@ -4707,13 +5067,14 @@ get_more:

ctxt->instate = state;

return;

}

- if (buf != NULL)

- xmlFatalErrMsgStr(ctxt, XML_ERR_COMMENT_NOT_FINISHED,

- "Comment not terminated \n<!--%.50s\n",

+ if (buf != NULL) {

+ xmlFatalErrMsgStr(ctxt, XML_ERR_HYPHEN_IN_COMMENT,

+ "Double hyphen within comment: "

+ "<!--%.50s\n",

buf);

- else

- xmlFatalErrMsgStr(ctxt, XML_ERR_COMMENT_NOT_FINISHED,

- "Comment not terminated \n", NULL);

+ } else

+ xmlFatalErrMsgStr(ctxt, XML_ERR_HYPHEN_IN_COMMENT,

+ "Double hyphen within comment\n", NULL);

in++;

ctxt->input->col++;

}

@@ -4731,7 +5092,7 @@ get_more:

/**

* xmlParsePITarget:

* @ctxt: an XML parser context

- *

+ *

* parse the name of a PI

* [17] PITarget ::= Name - (('X' | 'x') ('M' | 'm') ('L' | 'l'))

@@ -4768,8 +5129,8 @@ xmlParsePITarget(xmlParserCtxtPtr ctxt) {

NULL, NULL);

}

if ((name != NULL) && (xmlStrchr(name, ':') != NULL)) {

- xmlNsErr(ctxt, XML_NS_ERR_COLON,

- "colon are forbidden from PI names '%s'\n", name, NULL, NULL);

+ xmlNsErr(ctxt, XML_NS_ERR_COLON,

+ "colons are forbidden from PI names '%s'\n", name, NULL, NULL);

}

return(name);

}

@@ -4779,7 +5140,7 @@ xmlParsePITarget(xmlParserCtxtPtr ctxt) {

* xmlParseCatalogPI:

* @ctxt: an XML parser context

* @catalog: the PI value string

- *

+ *

* parse an XML Catalog Processing Instruction.

* <?oasis-xml-catalog catalog="http://example.com/catalog.xml"?>

@@ -4839,7 +5200,7 @@ error:

/**

* xmlParsePI:

* @ctxt: an XML parser context

- *

+ *

* parse an XML Processing Instruction.

* [16] PI ::= '<?' PITarget (S (Char* - (Char* '?>' Char*)))? '?>'

@@ -4850,8 +5211,8 @@ error:

void

xmlParsePI(xmlParserCtxtPtr ctxt) {

xmlChar *buf = NULL;

- int len = 0;

- int size = XML_PARSER_BUFFER_SIZE;

+ size_t len = 0;

+ size_t size = XML_PARSER_BUFFER_SIZE;

int cur, l;

const xmlChar *target;

xmlParserInputState state;

@@ -4908,9 +5269,8 @@ xmlParsePI(xmlParserCtxtPtr ctxt) {

((cur != '?') || (NXT(1) != '>'))) {

if (len + 5 >= size) {

xmlChar *tmp;

- size *= 2;

- tmp = (xmlChar *) xmlRealloc(buf, size * sizeof(xmlChar));

+ size_t new_size = size * 2;

+ tmp = (xmlChar *) xmlRealloc(buf, new_size);

if (tmp == NULL) {

xmlErrMemory(ctxt, NULL);

xmlFree(buf);

@@ -4918,6 +5278,7 @@ xmlParsePI(xmlParserCtxtPtr ctxt) {

return;

}

buf = tmp;

+ size = new_size;

}

count++;

if (count > 50) {

@@ -4927,6 +5288,14 @@ xmlParsePI(xmlParserCtxtPtr ctxt) {

return;

}

count = 0;

+ if ((len > XML_MAX_TEXT_LENGTH) &&

+ ((ctxt->options & XML_PARSE_HUGE) == 0)) {

+ xmlFatalErrMsgStr(ctxt, XML_ERR_PI_NOT_FINISHED,

+ "PI %s too big found", target);

+ xmlFree(buf);

+ ctxt->instate = state;

+ return;

+ }

}

COPY_BUF(l,buf,len,cur);

NEXTL(l);

@@ -4937,6 +5306,14 @@ xmlParsePI(xmlParserCtxtPtr ctxt) {

cur = CUR_CHAR(l);

}

+ if ((len > XML_MAX_TEXT_LENGTH) &&

+ ((ctxt->options & XML_PARSE_HUGE) == 0)) {

+ xmlFatalErrMsgStr(ctxt, XML_ERR_PI_NOT_FINISHED,

+ "PI %s too big found", target);

+ xmlFree(buf);

+ ctxt->instate = state;

+ return;

+ }

buf[len] = 0;

if (cur != '?') {

xmlFatalErrMsgStr(ctxt, XML_ERR_PI_NOT_FINISHED,

@@ -4998,7 +5375,7 @@ xmlParseNotationDecl(xmlParserCtxtPtr ctxt) {

const xmlChar *name;

xmlChar *Pubid;

xmlChar *Systemid;

if (CMP10(CUR_PTR, '<', '!', 'N', 'O', 'T', 'A', 'T', 'I', 'O', 'N')) {

xmlParserInputPtr input = ctxt->input;

SHRINK;

@@ -5021,8 +5398,8 @@ xmlParseNotationDecl(xmlParserCtxtPtr ctxt) {

return;

}

if (xmlStrchr(name, ':') != NULL) {

- xmlNsErr(ctxt, XML_NS_ERR_COLON,

- "colon are forbidden from notation names '%s'\n",

+ xmlNsErr(ctxt, XML_NS_ERR_COLON,

+ "colons are forbidden from notation names '%s'\n",

name, NULL, NULL);

}

SKIP_BLANKS;

@@ -5081,7 +5458,7 @@ xmlParseEntityDecl(xmlParserCtxtPtr ctxt) {

int isParameter = 0;

xmlChar *orig = NULL;

int skipped;

/* GROW; done in the caller */

if (CMP8(CUR_PTR, '<', '!', 'E', 'N', 'T', 'I', 'T', 'Y')) {

xmlParserInputPtr input = ctxt->input;

@@ -5110,8 +5487,8 @@ xmlParseEntityDecl(xmlParserCtxtPtr ctxt) {

return;

}

if (xmlStrchr(name, ':') != NULL) {

- xmlNsErr(ctxt, XML_NS_ERR_COLON,

- "colon are forbidden from entities names '%s'\n",

+ xmlNsErr(ctxt, XML_NS_ERR_COLON,

+ "colons are forbidden from entities names '%s'\n",

name, NULL, NULL);

}

skipped = SKIP_BLANKS;

@@ -5340,13 +5717,13 @@ xmlParseEntityDecl(xmlParserCtxtPtr ctxt) {

* [ VC: Fixed Attribute Default ]

* if an attribute has a default value declared with the #FIXED

- * keyword, instances of that attribute must match the default value.

+ * keyword, instances of that attribute must match the default value.

* [ WFC: No < in Attribute Values ]

* handled in xmlParseAttValue()

* returns: XML_ATTRIBUTE_NONE, XML_ATTRIBUTE_REQUIRED, XML_ATTRIBUTE_IMPLIED

- * or XML_ATTRIBUTE_FIXED.

+ * or XML_ATTRIBUTE_FIXED.

int

@@ -5395,7 +5772,7 @@ xmlParseDefaultDecl(xmlParserCtxtPtr ctxt, xmlChar **value) {

* [ VC: Notation Attributes ]

* Values of this type must match one of the notation names included

- * in the declaration; all notation names in the declaration must be declared.

+ * in the declaration; all notation names in the declaration must be declared.

* Returns: the notation attribute tree built while parsing

@@ -5595,15 +5972,15 @@ xmlParseEnumeratedType(xmlParserCtxtPtr ctxt, xmlEnumerationPtr *tree) {

* [ VC: Entity Name ]

* Values of type ENTITY must match the Name production, values

* of type ENTITIES must match Names; each Entity Name must match the

- * name of an unparsed entity declared in the DTD.

+ * name of an unparsed entity declared in the DTD.

* [ VC: Name Token ]

* Values of type NMTOKEN must match the Nmtoken production; values

- * of type NMTOKENS must match Nmtokens.

+ * of type NMTOKENS must match Nmtokens.

* Returns the attribute type

-int

+int

xmlParseAttributeType(xmlParserCtxtPtr ctxt, xmlEnumerationPtr *tree) {

SHRINK;

if (CMP5(CUR_PTR, 'C', 'D', 'A', 'T', 'A')) {

@@ -5746,7 +6123,7 @@ xmlParseAttributeListDecl(xmlParserCtxtPtr ctxt) {

xmlFreeEnumeration(tree);

if ((ctxt->sax2) && (defaultValue != NULL) &&

- (def != XML_ATTRIBUTE_IMPLIED) &&

+ (def != XML_ATTRIBUTE_IMPLIED) &&

(def != XML_ATTRIBUTE_REQUIRED)) {

xmlAddDefAttrs(ctxt, elemName, attrName, defaultValue);

}

@@ -5775,7 +6152,7 @@ xmlParseAttributeListDecl(xmlParserCtxtPtr ctxt) {

* parse the declaration for a Mixed Element content

* The leading '(' and spaces have been skipped in xmlParseElementContentDecl

- *

+ *

* [51] Mixed ::= '(' S? '#PCDATA' (S? '|' S? Name)* S? ')*' |

* '(' S? '#PCDATA' S? ')'

@@ -5783,7 +6160,7 @@ xmlParseAttributeListDecl(xmlParserCtxtPtr ctxt) {

* [ VC: No Duplicate Types ]

* The same name must not appear more than once in a single

- * mixed-content declaration.

+ * mixed-content declaration.

* returns: the list of the xmlElementContentPtr describing the element choices

@@ -5883,7 +6260,7 @@ xmlParseElementMixedContentDecl(xmlParserCtxtPtr ctxt, int inputchk) {

* parse the declaration for a Mixed Element content

* The leading '(' and spaces have been skipped in xmlParseElementContentDecl

- *

+ *

* [47] children ::= (choice | seq) ('?' | '*' | '+')?

@@ -5904,7 +6281,7 @@ xmlParseElementMixedContentDecl(xmlParserCtxtPtr ctxt, int inputchk) {

* be empty, and neither the first nor last non-blank character of

* the replacement text should be a connector (| or ,).

- * Returns the tree of xmlElementContentPtr describing the element

+ * Returns the tree of xmlElementContentPtr describing the element

* hierarchy.

static xmlElementContentPtr

@@ -6217,7 +6594,7 @@ xmlParseElementChildrenContentDecl(xmlParserCtxtPtr ctxt, int inputchk) {

* parse the declaration for an Element content either Mixed or Children,

* the cases EMPTY and ANY are handled directly in xmlParseElementDecl

- *

+ *

* [46] contentspec ::= 'EMPTY' | 'ANY' | Mixed | children

* returns: the type of element content XML_ELEMENT_TYPE_xxx

@@ -6345,7 +6722,7 @@ xmlParseElementDecl(xmlParserCtxtPtr ctxt) {

xmlFatalErrMsg(ctxt, XML_ERR_ENTITY_BOUNDARY,

"Element declaration doesn't start and stop in the same entity\n");

}

NEXT;

if ((ctxt->sax != NULL) && (!ctxt->disableSAX) &&

(ctxt->sax->elementDecl != NULL)) {

@@ -6357,7 +6734,7 @@ xmlParseElementDecl(xmlParserCtxtPtr ctxt) {

* this is a trick: if xmlAddElementDecl is called,

* instead of copying the full tree it is plugged directly

- * if called from the parser. Avoid duplicating the

+ * if called from the parser. Avoid duplicating the

* interfaces or change the API/ABI

xmlFreeDocElementContent(ctxt->myDoc, content);

@@ -6374,8 +6751,8 @@ xmlParseElementDecl(xmlParserCtxtPtr ctxt) {

* xmlParseConditionalSections

* @ctxt: an XML parser context

- * [61] conditionalSect ::= includeSect | ignoreSect

- * [62] includeSect ::= '<![' S? 'INCLUDE' S? '[' extSubsetDecl ']]>'

+ * [61] conditionalSect ::= includeSect | ignoreSect

+ * [62] includeSect ::= '<![' S? 'INCLUDE' S? '[' extSubsetDecl ']]>'

* [63] ignoreSect ::= '<![' S? 'IGNORE' S? '[' ignoreSectContents* ']]>'

* [64] ignoreSectContents ::= Ignore ('<![' ignoreSectContents ']]>' Ignore)*

* [65] Ignore ::= Char* - (Char* ('<![' | ']]>') Char*)

@@ -6527,7 +6904,7 @@ xmlParseConditionalSections(xmlParserCtxtPtr ctxt) {

/**

* xmlParseMarkupDecl:

* @ctxt: an XML parser context

- *

+ *

* parse Markup declarations

* [29] markupdecl ::= elementdecl | AttlistDecl | EntityDecl |

@@ -6544,7 +6921,7 @@ xmlParseConditionalSections(xmlParserCtxtPtr ctxt) {

* In the internal DTD subset, parameter-entity references can occur

* only where markup declarations can occur, not within markup declarations.

* (This does not apply to references that occur in external parameter

- * entities or to the external subset.)

+ * entities or to the external subset.)

void

xmlParseMarkupDecl(xmlParserCtxtPtr ctxt) {

@@ -6673,7 +7050,7 @@ xmlParseTextDecl(xmlParserCtxtPtr ctxt) {

* @ctxt: an XML parser context

* @ExternalID: the external identifier

* @SystemID: the system identifier (or URL)

- *

+ *

* parse Markup declarations from an external subset

* [30] extSubset ::= textDecl? extSubsetDecl

@@ -6686,7 +7063,7 @@ xmlParseExternalSubset(xmlParserCtxtPtr ctxt, const xmlChar *ExternalID,

xmlDetectSAX2(ctxt);

GROW;

- if ((ctxt->encoding == (const xmlChar *)XML_CHAR_ENCODING_NONE) &&

+ if ((ctxt->encoding == NULL) &&

(ctxt->input->end - ctxt->input->cur >= 4)) {

xmlChar start[4];

xmlCharEncoding enc;

@@ -6852,8 +7229,15 @@ xmlParseReference(xmlParserCtxtPtr ctxt) {

* The first reference to the entity triggers a parsing phase

* where the ent->children is filled with the result from

* the parsing.

- */

- if (ent->checked == 0) {

+ * Note: external parsed entities will not be loaded, as this is not

+ * required for a non-validating parser, unless the validating or

+ * entity-substituting parser options were given. Not loading them is

+ * far more secure as the parser will only process data coming from

+ * the document entity by default.

+ */

+ if ((ent->checked == 0) &&

+ ((ent->etype != XML_EXTERNAL_GENERAL_PARSED_ENTITY) ||

+ (ctxt->options & (XML_PARSE_NOENT | XML_PARSE_DTDVALID)))) {

unsigned long oldnbent = ctxt->nbentities;

@@ -6895,13 +7279,15 @@ xmlParseReference(xmlParserCtxtPtr ctxt) {

* Store the number of entities needing parsing for this entity

* content and do checkings

- ent->checked = ctxt->nbentities - oldnbent;

+ ent->checked = (ctxt->nbentities - oldnbent + 1) * 2;

+ if ((ent->content != NULL) && (xmlStrchr(ent->content, '<')))

+ ent->checked |= 1;

if (ret == XML_ERR_ENTITY_LOOP) {

xmlFatalErr(ctxt, XML_ERR_ENTITY_LOOP, NULL);

xmlFreeNodeList(list);

return;

}

- if (xmlParserEntityCheck(ctxt, 0, ent)) {

+ if (xmlParserEntityCheck(ctxt, 0, ent, 0)) {

xmlFreeNodeList(list);

return;

}

@@ -6941,6 +7327,7 @@ xmlParseReference(xmlParserCtxtPtr ctxt) {

ent->owner = 1;

while (list != NULL) {

list->parent = (xmlNodePtr) ent;

+ xmlSetTreeDoc(list, ent->doc);

if (list->next == NULL)

ent->last = list;

list = list->next;

@@ -6954,14 +7341,15 @@ xmlParseReference(xmlParserCtxtPtr ctxt) {

(ret != XML_WAR_UNDECLARED_ENTITY)) {

xmlFatalErrMsgStr(ctxt, XML_ERR_UNDECLARED_ENTITY,

"Entity '%s' failed to parse\n", ent->name);

+ xmlParserEntityCheck(ctxt, 0, ent, 0);

} else if (list != NULL) {

xmlFreeNodeList(list);

list = NULL;

}

if (ent->checked == 0)

- ent->checked = 1;

+ ent->checked = 2;

} else if (ent->checked != 1) {

- ctxt->nbentities += ent->checked;

+ ctxt->nbentities += ent->checked / 2;

}

@@ -7052,14 +7440,19 @@ xmlParseReference(xmlParserCtxtPtr ctxt) {

* Seems we are generating the DOM content, do

* a simple tree copy for all references except the first

* In the first occurrence list contains the replacement.

- * progressive == 2 means we are operating on the Reader

- * and since nodes are discarded we must copy all the time.

if (((list == NULL) && (ent->owner == 0)) ||

(ctxt->parseMode == XML_PARSE_READER)) {

xmlNodePtr nw = NULL, cur, firstChild = NULL;

+ * We are copying here, make sure there is no abuse

+ */

+ ctxt->sizeentcopy += ent->length + 5;

+ if (xmlParserEntityCheck(ctxt, 0, ent, ctxt->sizeentcopy))

+ return;

+ /*

* when operating on a reader, the entities definitions

* are always owning the entities subtree.

if (ctxt->parseMode == XML_PARSE_READER)

@@ -7096,9 +7489,17 @@ xmlParseReference(xmlParserCtxtPtr ctxt) {

if (ent->etype == XML_EXTERNAL_GENERAL_PARSED_ENTITY)

xmlAddEntityReference(ent, firstChild, nw);

#endif /* LIBXML_LEGACY_ENABLED */

- } else if (list == NULL) {

+ } else if ((list == NULL) || (ctxt->inputNr > 0)) {

xmlNodePtr nw = NULL, cur, next, last,

firstChild = NULL;

+ /*

+ * We are copying here, make sure there is no abuse

+ */

+ ctxt->sizeentcopy += ent->length + 5;

+ if (xmlParserEntityCheck(ctxt, 0, ent, ctxt->sizeentcopy))

+ return;

* Copy the entity child list and make it the new

* entity child list. The goal is to make sure any

@@ -7215,7 +7616,7 @@ xmlParseEntityRef(xmlParserCtxtPtr ctxt) {

NEXT;

- * Predefined entites override any extra definition

+ * Predefined entities override any extra definition

if ((ctxt->options & XML_PARSE_OLDSAX) == 0) {

ent = xmlGetPredefinedEntity(name);

@@ -7224,7 +7625,7 @@ xmlParseEntityRef(xmlParserCtxtPtr ctxt) {

}

- * Increate the number of entity references parsed

+ * Increase the number of entity references parsed

ctxt->nbentities++;

@@ -7235,7 +7636,7 @@ xmlParseEntityRef(xmlParserCtxtPtr ctxt) {

if (ctxt->sax != NULL) {

if (ctxt->sax->getEntity != NULL)

ent = ctxt->sax->getEntity(ctxt->userData, name);

- if ((ctxt->wellFormed == 1 ) && (ent == NULL) &&

+ if ((ctxt->wellFormed == 1 ) && (ent == NULL) &&

(ctxt->options & XML_PARSE_OLDSAX))

ent = xmlGetPredefinedEntity(name);

if ((ctxt->wellFormed == 1 ) && (ent == NULL) &&

@@ -7281,6 +7682,7 @@ xmlParseEntityRef(xmlParserCtxtPtr ctxt) {

ctxt->sax->reference(ctxt->userData, name);

}

+ xmlParserEntityCheck(ctxt, 0, ent, 0);

ctxt->valid = 0;

}

@@ -7308,14 +7710,16 @@ xmlParseEntityRef(xmlParserCtxtPtr ctxt) {

* [ WFC: No < in Attribute Values ]

* The replacement text of any entity referred to directly or

* indirectly in an attribute value (other than "&lt;") must

- * not contain a <.

+ * not contain a <.

else if ((ctxt->instate == XML_PARSER_ATTRIBUTE_VALUE) &&

- (ent != NULL) && (ent->content != NULL) &&

- (ent->etype != XML_INTERNAL_PREDEFINED_ENTITY) &&

- (xmlStrchr(ent->content, '<'))) {

- xmlFatalErrMsgStr(ctxt, XML_ERR_LT_IN_ATTRIBUTE,

- "'<' in entity '%s' is not allowed in attributes values\n", name);

+ (ent != NULL) &&

+ (ent->etype != XML_INTERNAL_PREDEFINED_ENTITY)) {

+ if (((ent->checked & 1) || (ent->checked == 0)) &&

+ (ent->content != NULL) && (xmlStrchr(ent->content, '<'))) {

+ xmlFatalErrMsgStr(ctxt, XML_ERR_LT_IN_ATTRIBUTE,

+ "'<' in entity '%s' is not allowed in attributes values\n", name);

+ }

}

@@ -7337,7 +7741,7 @@ xmlParseEntityRef(xmlParserCtxtPtr ctxt) {

* [ WFC: No Recursion ]

* A parsed entity must not contain a recursive reference

- * to itself, either directly or indirectly.

+ * to itself, either directly or indirectly.

* Done somewhere else

return(ent);

@@ -7406,7 +7810,7 @@ xmlParseStringEntityRef(xmlParserCtxtPtr ctxt, const xmlChar ** str) {

- * Predefined entites override any extra definition

+ * Predefined entities override any extra definition

if ((ctxt->options & XML_PARSE_OLDSAX) == 0) {

ent = xmlGetPredefinedEntity(name);

@@ -7459,7 +7863,7 @@ xmlParseStringEntityRef(xmlParserCtxtPtr ctxt, const xmlChar ** str) {

* is not obligated to read and process their declarations;

* for such documents, the rule that an entity must be

* declared is a well-formedness constraint only if

- * standalone='yes'.

+ * standalone='yes'.

if (ent == NULL) {

if ((ctxt->standalone == 1) ||

@@ -7472,6 +7876,7 @@ xmlParseStringEntityRef(xmlParserCtxtPtr ctxt, const xmlChar ** str) {

"Entity '%s' not defined\n",

name);

}

+ xmlParserEntityCheck(ctxt, 0, ent, 0);

/* TODO ? check regressions ctxt->valid = 0; */

}

@@ -7550,7 +7955,7 @@ xmlParseStringEntityRef(xmlParserCtxtPtr ctxt, const xmlChar ** str) {

* [ WFC: No Recursion ]

* A parsed entity must not contain a recursive

- * reference to itself, either directly or indirectly.

+ * reference to itself, either directly or indirectly.

* [ WFC: Entity Declared ]

* In a document without any DTD, a document with only an internal DTD

@@ -7631,6 +8036,7 @@ xmlParsePEReference(xmlParserCtxtPtr ctxt)

name, NULL);

ctxt->valid = 0;

}

+ xmlParserEntityCheck(ctxt, 0, NULL, 0);

} else {

* Internal checking in case the entity quest barfed

@@ -7732,7 +8138,7 @@ xmlLoadEntityContent(xmlParserCtxtPtr ctxt, xmlEntityPtr entity) {

while ((ctxt->input == input) && (ctxt->input->cur < ctxt->input->end) &&

(IS_CHAR(c))) {

xmlBufferAdd(buf, ctxt->input->cur, l);

- if (count++ > 100) {

+ if (count++ > XML_PARSER_CHUNK_SIZE) {

count = 0;

GROW;

if (ctxt->instate == XML_PARSER_EOF) {

@@ -7742,6 +8148,15 @@ xmlLoadEntityContent(xmlParserCtxtPtr ctxt, xmlEntityPtr entity) {

}

NEXTL(l);

c = CUR_CHAR(l);

+ if (c == 0) {

+ count = 0;

+ GROW;

+ if (ctxt->instate == XML_PARSER_EOF) {

+ xmlBufferFree(buf);

+ return(-1);

+ }

+ c = CUR_CHAR(l);

+ }

}

if ((ctxt->input == input) && (ctxt->input->cur >= ctxt->input->end)) {

@@ -7861,6 +8276,7 @@ xmlParseStringPEReference(xmlParserCtxtPtr ctxt, const xmlChar **str) {

name, NULL);

ctxt->valid = 0;

}

+ xmlParserEntityCheck(ctxt, 0, NULL, 0);

} else {

* Internal checking in case the entity quest barfed

@@ -7884,12 +8300,12 @@ xmlParseStringPEReference(xmlParserCtxtPtr ctxt, const xmlChar **str) {

* parse a DOCTYPE declaration

- * [28] doctypedecl ::= '<!DOCTYPE' S Name (S ExternalID)? S?

+ * [28] doctypedecl ::= '<!DOCTYPE' S Name (S ExternalID)? S?

* ('[' (markupdecl | PEReference | S)* ']' S?)? '>'

* [ VC: Root Element Type ]

* The Name in the document type declaration must match the element

- * type of the root element.

+ * type of the root element.

void

@@ -7973,7 +8389,7 @@ xmlParseInternalSubset(xmlParserCtxtPtr ctxt) {

ctxt->instate = XML_PARSER_DTD;

NEXT;

- * Parse the succession of Markup declarations and

+ * Parse the succession of Markup declarations and

* PEReferences.

* Subsequence (markupdecl | PEReference | S)*

@@ -7997,7 +8413,7 @@ xmlParseInternalSubset(xmlParserCtxtPtr ctxt) {

break;

}

- if (RAW == ']') {

+ if (RAW == ']') {

NEXT;

SKIP_BLANKS;

}

@@ -8028,8 +8444,8 @@ xmlParseInternalSubset(xmlParserCtxtPtr ctxt) {

* [ WFC: No < in Attribute Values ]

* The replacement text of any entity referred to directly or indirectly in

- * an attribute value (other than "&lt;") must not contain a <.

- *

+ * an attribute value (other than "&lt;") must not contain a <.

+ *

* [ VC: Attribute Value Type ]

* The attribute must have been declared; the value must be of the type

* declared for it.

@@ -8110,7 +8526,7 @@ xmlParseAttribute(xmlParserCtxtPtr ctxt, xmlChar **value) {

/**

* xmlParseStartTag:

* @ctxt: an XML parser context

- *

+ *

* parse a start of tag either for rule element or

* EmptyElement. In both cases we don't parse the tag closing chars.

@@ -8118,13 +8534,13 @@ xmlParseAttribute(xmlParserCtxtPtr ctxt, xmlChar **value) {

* [ WFC: Unique Att Spec ]

* No attribute name may appear more than once in the same start-tag or

- * empty-element tag.

+ * empty-element tag.

* [44] EmptyElemTag ::= '<' Name (S Attribute)* S? '/>'

* [ WFC: Unique Att Spec ]

* No attribute name may appear more than once in the same start-tag or

- * empty-element tag.

+ * empty-element tag.

* With namespace:

@@ -8163,7 +8579,7 @@ xmlParseStartTag(xmlParserCtxtPtr ctxt) {

SKIP_BLANKS;

GROW;

- while (((RAW != '>') &&

+ while (((RAW != '>') &&

((RAW != '/') || (NXT(1) != '>')) &&

(IS_BYTE_CHAR(RAW))) && (ctxt->instate != XML_PARSER_EOF)) {

const xmlChar *q = CUR_PTR;

@@ -8174,7 +8590,7 @@ xmlParseStartTag(xmlParserCtxtPtr ctxt) {

* [ WFC: Unique Att Spec ]

* No attribute name may appear more than once in the same

- * start-tag or empty-element tag.

+ * start-tag or empty-element tag.

for (i = 0; i < nbatts;i += 2) {

if (xmlStrEqual(atts[i], attname)) {

@@ -8223,7 +8639,7 @@ xmlParseStartTag(xmlParserCtxtPtr ctxt) {

xmlFree(attvalue);

}

-failed:

+failed:

GROW

if ((RAW == '>') || (((RAW == '/') && (NXT(1) == '>'))))

@@ -8305,7 +8721,7 @@ xmlParseEndTag1(xmlParserCtxtPtr ctxt, int line) {

* [ WFC: Element Type Match ]

* The Name in an element's end-tag must match the element type in the

- * start-tag.

+ * start-tag.

if (name != (xmlChar*)1) {

@@ -8401,7 +8817,7 @@ xmlParseQName(xmlParserCtxtPtr ctxt, const xmlChar **prefix) {

if (CUR == ':') {

l = xmlParseName(ctxt);

if (l != NULL) {

- xmlNsErr(ctxt, XML_NS_ERR_QNAME,

+ xmlNsErr(ctxt, XML_NS_ERR_QNAME,

"Failed to parse QName '%s'\n", l, NULL, NULL);

*prefix = NULL;

return(l);

@@ -8484,7 +8900,7 @@ xmlParseQNameAndCompare(xmlParserCtxtPtr ctxt, xmlChar const *name,

cmp = prefix;

while (*in != 0 && *in == *cmp) {

- ++in;

+ ++in;

++cmp;

}

if ((*cmp == 0) && (*in == ':')) {

@@ -8522,20 +8938,20 @@ xmlParseQNameAndCompare(xmlParserCtxtPtr ctxt, xmlChar const *name,