Fix regression parsing public IDs literals in HTML

Fix regression introduced when reworking htmlParsePubidLiteral in
commit 93ce33c2.

Fixes #318.
This commit is contained in:
Nick Wellnhofer 2022-01-10 13:32:14 +01:00
parent dea91c97de
commit 2732b23466
5 changed files with 35 additions and 1 deletions

View File

@ -3045,7 +3045,7 @@ htmlParsePubidLiteral(htmlParserCtxtPtr ctxt) {
NEXT;
}
if (CUR != '"') {
if (CUR != quote) {
htmlParseErr(ctxt, XML_ERR_LITERAL_NOT_FINISHED,
"Unfinished PubidLiteral\n", NULL, NULL);
} else {

View File

@ -0,0 +1,6 @@
<!DOCTYPE html PUBLIC "-//W3C//DTD HTML 4.01//EN">
<html>
<head><meta http-equiv='\"content-type\"' content='\"text/html;charset=utf-8\"'></head>
<body>
</body>
</html>

View File

View File

@ -0,0 +1,22 @@
SAX.setDocumentLocator()
SAX.startDocument()
SAX.internalSubset(html, -//W3C//DTD HTML 4.01//EN, )
SAX.startElement(html)
SAX.characters(
, 1)
SAX.startElement(head)
SAX.startElement(meta, http-equiv='\"content-type\"', content='\"text/html;charset=utf-8\"')
SAX.endElement(meta)
SAX.endElement(head)
SAX.characters(
, 1)
SAX.startElement(body)
SAX.characters(
, 1)
SAX.endElement(body)
SAX.characters(
, 1)
SAX.endElement(html)
SAX.characters(
, 1)
SAX.endDocument()

6
test/HTML/issue318.html Normal file
View File

@ -0,0 +1,6 @@
<!DOCTYPE html PUBLIC '-//W3C//DTD HTML 4.01//EN'>
<html>
<head><meta http-equiv=\"content-type\" content=\"text/html;charset=utf-8\"></head>
<body>
</body>
</html>