566012 part 2 fix regresion tests and push mode

* test/utf16bebom.xml: regression test showed that this test case was
  broken but previous behaviour would not detect it !
* parser.c: fix 566012 for the push mode of the parser, tricky !
* test/ebcdic_566012.xml result//ebcdic_566012.xml*: add the test to the
  regression suite
This commit is contained in:
Daniel Veillard 2009-08-26 14:37:00 +02:00
parent 7e385bd4e2
commit a6c76a26ca
9 changed files with 66 additions and 5 deletions

View File

@ -10007,6 +10007,12 @@ xmlParseXMLDecl(xmlParserCtxtPtr ctxt) {
} }
xmlFatalErrMsg(ctxt, XML_ERR_SPACE_REQUIRED, "Blank needed here\n"); xmlFatalErrMsg(ctxt, XML_ERR_SPACE_REQUIRED, "Blank needed here\n");
} }
/*
* We can grow the input buffer freely at that point
*/
GROW;
SKIP_BLANKS; SKIP_BLANKS;
ctxt->input->standalone = xmlParseSDDecl(ctxt); ctxt->input->standalone = xmlParseSDDecl(ctxt);
@ -11493,6 +11499,7 @@ int
xmlParseChunk(xmlParserCtxtPtr ctxt, const char *chunk, int size, xmlParseChunk(xmlParserCtxtPtr ctxt, const char *chunk, int size,
int terminate) { int terminate) {
int end_in_lf = 0; int end_in_lf = 0;
int remain = 0;
if (ctxt == NULL) if (ctxt == NULL)
return(XML_ERR_INTERNAL_ERROR); return(XML_ERR_INTERNAL_ERROR);
@ -11505,12 +11512,41 @@ xmlParseChunk(xmlParserCtxtPtr ctxt, const char *chunk, int size,
end_in_lf = 1; end_in_lf = 1;
size--; size--;
} }
xmldecl_done:
if ((size > 0) && (chunk != NULL) && (ctxt->input != NULL) && if ((size > 0) && (chunk != NULL) && (ctxt->input != NULL) &&
(ctxt->input->buf != NULL) && (ctxt->instate != XML_PARSER_EOF)) { (ctxt->input->buf != NULL) && (ctxt->instate != XML_PARSER_EOF)) {
int base = ctxt->input->base - ctxt->input->buf->buffer->content; int base = ctxt->input->base - ctxt->input->buf->buffer->content;
int cur = ctxt->input->cur - ctxt->input->base; int cur = ctxt->input->cur - ctxt->input->base;
int res; int res;
/*
* Specific handling if we autodetected an encoding, we should not
* push more than the first line ... which depend on the encoding
* And only push the rest once the final encoding was detected
*/
if ((ctxt->instate == XML_PARSER_START) && (ctxt->input != NULL) &&
(ctxt->input->buf != NULL) && (ctxt->input->buf->encoder != NULL)) {
int len = 45;
if ((xmlStrcasestr(BAD_CAST ctxt->input->buf->encoder->name,
BAD_CAST "UTF-16")) ||
(xmlStrcasestr(BAD_CAST ctxt->input->buf->encoder->name,
BAD_CAST "UTF16")))
len = 90;
else if ((xmlStrcasestr(BAD_CAST ctxt->input->buf->encoder->name,
BAD_CAST "UCS-4")) ||
(xmlStrcasestr(BAD_CAST ctxt->input->buf->encoder->name,
BAD_CAST "UCS4")))
len = 180;
if (ctxt->input->buf->rawconsumed < len)
len -= ctxt->input->buf->rawconsumed;
remain = size - len;
size = len;
}
res =xmlParserInputBufferPush(ctxt->input->buf, size, chunk); res =xmlParserInputBufferPush(ctxt->input->buf, size, chunk);
if (res < 0) { if (res < 0) {
ctxt->errNo = XML_PARSER_EOF; ctxt->errNo = XML_PARSER_EOF;
@ -11542,13 +11578,23 @@ xmlParseChunk(xmlParserCtxtPtr ctxt, const char *chunk, int size,
} }
} }
} }
if (remain != 0)
xmlParseTryOrFinish(ctxt, 0);
else
xmlParseTryOrFinish(ctxt, terminate); xmlParseTryOrFinish(ctxt, terminate);
if ((ctxt->errNo != XML_ERR_OK) && (ctxt->disableSAX == 1))
return(ctxt->errNo);
if (remain != 0) {
chunk += size;
size = remain;
remain = 0;
goto xmldecl_done;
}
if ((end_in_lf == 1) && (ctxt->input != NULL) && if ((end_in_lf == 1) && (ctxt->input != NULL) &&
(ctxt->input->buf != NULL)) { (ctxt->input->buf != NULL)) {
xmlParserInputBufferPush(ctxt->input->buf, 1, "\r"); xmlParserInputBufferPush(ctxt->input->buf, 1, "\r");
} }
if ((ctxt->errNo != XML_ERR_OK) && (ctxt->disableSAX == 1))
return(ctxt->errNo);
if (terminate) { if (terminate) {
/* /*
* Check for termination * Check for termination

1
result/ebcdic_566012.xml Normal file
View File

@ -0,0 +1 @@
Lo§”“@¥…™¢‰–•~ñKð@…•ƒ–„‰•‡~ÉÂÔ`ññôñon%L£…¢£@<40>££™~JàZan%

View File

@ -0,0 +1 @@
0 1 test 1 0

View File

@ -0,0 +1 @@
0 1 test 1 0

View File

@ -0,0 +1,5 @@
SAX.setDocumentLocator()
SAX.startDocument()
SAX.startElement(test, attr='ÄÖÜ')
SAX.endElement(test)
SAX.endDocument()

View File

@ -0,0 +1,5 @@
SAX.setDocumentLocator()
SAX.startDocument()
SAX.startElementNs(test, NULL, NULL, 0, 1, 0, attr='ÄÖ...', 6)
SAX.endElementNs(test, NULL, NULL)
SAX.endDocument()

View File

@ -0,0 +1 @@
Lo§”“@¥…™¢‰–•~ñKð@…•ƒ–„‰•‡~ÉÂÔ`ññôñon%L£…¢£@<40>££™~JàZan%

1
test/ebcdic_566012.xml Normal file
View File

@ -0,0 +1 @@
Lo§”“@¥…™¢‰–•~ñKð@…•ƒ–„‰•‡~ÉÂÔ`ññôñ@on%L£…¢£@<40>££™~JàZ@an%

Binary file not shown.