parser: Fix detection of duplicate attributes

We really need a second scan if more than one namespace clash was
detected.
This commit is contained in:
Nick Wellnhofer 2024-10-28 20:12:52 +01:00
parent 89b9f45711
commit ffb058f484
5 changed files with 101 additions and 0 deletions

View File

@ -8928,6 +8928,35 @@ xmlAttrHashInsert(xmlParserCtxtPtr ctxt, unsigned size, const xmlChar *name,
return(INT_MAX);
}
static int
xmlAttrHashInsertQName(xmlParserCtxtPtr ctxt, unsigned size,
const xmlChar *name, const xmlChar *prefix,
unsigned hashValue, int aindex) {
xmlAttrHashBucket *table = ctxt->attrHash;
xmlAttrHashBucket *bucket;
unsigned hindex;
hindex = hashValue & (size - 1);
bucket = &table[hindex];
while (bucket->index >= 0) {
const xmlChar **atts = &ctxt->atts[bucket->index];
if ((name == atts[0]) && (prefix == atts[1]))
return(bucket->index);
hindex++;
bucket++;
if (hindex >= size) {
hindex = 0;
bucket = table;
}
}
bucket->index = aindex;
return(INT_MAX);
}
/**
* xmlParseStartTag2:
* @ctxt: an XML parser context
@ -8976,6 +9005,8 @@ xmlParseStartTag2(xmlParserCtxtPtr ctxt, const xmlChar **pref,
int nratts, nbatts, nbdef;
int i, j, nbNs, nbTotalDef, attval, nsIndex, maxAtts;
int alloc = 0;
int numNsErr = 0;
int numDupErr = 0;
if (RAW != '<') return(NULL);
NEXT1;
@ -9354,10 +9385,12 @@ next_attr:
if (res < INT_MAX) {
if (aprefix == atts[res+1]) {
xmlErrAttributeDup(ctxt, aprefix, attname);
numDupErr += 1;
} else {
xmlNsErr(ctxt, XML_NS_ERR_ATTRIBUTE_REDEFINED,
"Namespaced Attribute %s in '%s' redefined\n",
attname, nsuri, NULL);
numNsErr += 1;
}
}
}
@ -9456,6 +9489,43 @@ next_attr:
}
}
/*
* Using a single hash table for nsUri/localName pairs cannot
* detect duplicate QNames reliably. The following example will
* only result in two namespace errors.
*
* <doc xmlns:a="a" xmlns:b="a">
* <elem a:a="" b:a="" b:a=""/>
* </doc>
*
* If we saw more than one namespace error but no duplicate QNames
* were found, we have to scan for duplicate QNames.
*/
if ((numDupErr == 0) && (numNsErr > 1)) {
memset(ctxt->attrHash, -1,
attrHashSize * sizeof(ctxt->attrHash[0]));
for (i = 0, j = 0; j < nratts; i += 5, j++) {
unsigned hashValue, nameHashValue, prefixHashValue;
int res;
aprefix = atts[i+1];
if (aprefix == NULL)
continue;
attname = atts[i];
/* Hash values always have bit 31 set, see dict.c */
nameHashValue = ctxt->attallocs[j] | 0x80000000;
prefixHashValue = xmlDictComputeHash(ctxt->dict, aprefix);
hashValue = xmlDictCombineHash(nameHashValue, prefixHashValue);
res = xmlAttrHashInsertQName(ctxt, attrHashSize, attname,
aprefix, hashValue, i);
if (res < INT_MAX)
xmlErrAttributeDup(ctxt, aprefix, attname);
}
}
/*
* Reconstruct attribute pointers
*/

View File

@ -0,0 +1,9 @@
./test/errors/dup-xml-attr2.xml:2: namespace error : Namespaced Attribute a in 'urn:a' redefined
<elem a:a="" b:a="" b:a=""/>
^
./test/errors/dup-xml-attr2.xml:2: namespace error : Namespaced Attribute a in 'urn:a' redefined
<elem a:a="" b:a="" b:a=""/>
^
./test/errors/dup-xml-attr2.xml:2: parser error : Attribute b:a redefined
<elem a:a="" b:a="" b:a=""/>
^

View File

@ -0,0 +1,9 @@
./test/errors/dup-xml-attr2.xml:2: namespace error : Namespaced Attribute a in 'urn:a' redefined
<elem a:a="" b:a="" b:a=""/>
^
./test/errors/dup-xml-attr2.xml:2: namespace error : Namespaced Attribute a in 'urn:a' redefined
<elem a:a="" b:a="" b:a=""/>
^
./test/errors/dup-xml-attr2.xml:2: parser error : Attribute b:a redefined
<elem a:a="" b:a="" b:a=""/>
^

View File

@ -0,0 +1,10 @@
./test/errors/dup-xml-attr2.xml:2: namespace error : Namespaced Attribute a in 'urn:a' redefined
<elem a:a="" b:a="" b:a=""/>
^
./test/errors/dup-xml-attr2.xml:2: namespace error : Namespaced Attribute a in 'urn:a' redefined
<elem a:a="" b:a="" b:a=""/>
^
./test/errors/dup-xml-attr2.xml:2: parser error : Attribute b:a redefined
<elem a:a="" b:a="" b:a=""/>
^
./test/errors/dup-xml-attr2.xml : failed to parse

View File

@ -0,0 +1,3 @@
<doc xmlns:a="urn:a" xmlns:b="urn:a">
<elem a:a="" b:a="" b:a=""/>
</doc>