libxml2/xmllint.c

3641 lines
101 KiB
C
Raw Permalink Normal View History

/*
* xmllint.c : a small tester program for XML input.
*
* See Copyright for the status of this software.
*
* daniel@veillard.com
*/
2001-04-21 16:57:29 +00:00
#include "libxml.h"
#include <string.h>
#include <stdarg.h>
2022-12-08 03:45:37 +01:00
#include <stdio.h>
#include <stdlib.h>
#include <errno.h>
#include <limits.h>
#include <fcntl.h>
#ifdef _WIN32
#include <io.h>
#include <sys/timeb.h>
#else
#include <sys/time.h>
#include <unistd.h>
#endif
#if HAVE_DECL_MMAP
#include <sys/mman.h>
#include <sys/stat.h>
/* seems needed for Solaris */
#ifndef MAP_FAILED
#define MAP_FAILED ((void *) -1)
#endif
#endif
#include <libxml/xmlmemory.h>
#include <libxml/parser.h>
#include <libxml/parserInternals.h>
#include <libxml/HTMLparser.h>
#include <libxml/HTMLtree.h>
#include <libxml/tree.h>
#include <libxml/xpath.h>
#include <libxml/xpathInternals.h>
#include <libxml/debugXML.h>
#include <libxml/xmlerror.h>
#ifdef LIBXML_XINCLUDE_ENABLED
#include <libxml/xinclude.h>
#endif
#ifdef LIBXML_CATALOG_ENABLED
#include <libxml/catalog.h>
#endif
#include <libxml/xmlreader.h>
#ifdef LIBXML_SCHEMATRON_ENABLED
#include <libxml/schematron.h>
#endif
#ifdef LIBXML_RELAXNG_ENABLED
#include <libxml/relaxng.h>
#endif
#ifdef LIBXML_SCHEMAS_ENABLED
#include <libxml/xmlschemas.h>
#endif
#ifdef LIBXML_PATTERN_ENABLED
#include <libxml/pattern.h>
#endif
#ifdef LIBXML_C14N_ENABLED
#include <libxml/c14n.h>
#endif
#ifdef LIBXML_OUTPUT_ENABLED
#include <libxml/xmlsave.h>
#endif
#include "private/lint.h"
#ifndef STDIN_FILENO
#define STDIN_FILENO 0
#endif
#ifndef STDOUT_FILENO
#define STDOUT_FILENO 1
#endif
#define MAX_PATHS 64
#ifdef _WIN32
#define PATH_SEPARATOR ';'
#else
#define PATH_SEPARATOR ':'
#endif
#define HTML_BUF_SIZE 50000
/* Internal parser option */
#define XML_PARSE_UNZIP (1 << 24)
typedef enum {
XMLLINT_RETURN_OK = 0, /* No error */
XMLLINT_ERR_UNCLASS = 1, /* Unclassified */
XMLLINT_ERR_DTD = 2, /* Error in DTD */
XMLLINT_ERR_VALID = 3, /* Validation error */
XMLLINT_ERR_RDFILE = 4, /* CtxtReadFile error */
XMLLINT_ERR_SCHEMACOMP = 5, /* Schema compilation */
XMLLINT_ERR_OUT = 6, /* Error writing output */
XMLLINT_ERR_SCHEMAPAT = 7, /* Error in schema pattern */
/*XMLLINT_ERR_RDREGIS = 8,*/
XMLLINT_ERR_MEM = 9, /* Out of memory error */
XMLLINT_ERR_XPATH = 10, /* XPath evaluation error */
XMLLINT_ERR_XPATH_EMPTY = 11 /* XPath result is empty */
} xmllintReturnCode;
#ifdef _WIN32
typedef __time64_t xmlSeconds;
#else
typedef time_t xmlSeconds;
#endif
typedef struct {
xmlSeconds sec;
int usec;
} xmlTime;
typedef struct {
FILE *errStream;
xmlParserCtxtPtr ctxt;
xmlResourceLoader defaultResourceLoader;
int version;
int maxmem;
int nowrap;
int sax;
int callbacks;
int shell;
#ifdef LIBXML_DEBUG_ENABLED
int debugent;
#endif
int debug;
int copy;
int noout;
#ifdef LIBXML_OUTPUT_ENABLED
const char *output;
int format;
const char *encoding;
int compress;
#endif /* LIBXML_OUTPUT_ENABLED */
#ifdef LIBXML_VALID_ENABLED
int postvalid;
const char *dtdvalid;
const char *dtdvalidfpi;
int insert;
#endif
#ifdef LIBXML_RELAXNG_ENABLED
const char *relaxng;
xmlRelaxNGPtr relaxngschemas;
#endif
#ifdef LIBXML_SCHEMAS_ENABLED
const char *schema;
xmlSchemaPtr wxschemas;
#endif
#ifdef LIBXML_SCHEMATRON_ENABLED
const char *schematron;
xmlSchematronPtr wxschematron;
#endif
int repeat;
#if defined(LIBXML_HTML_ENABLED)
int html;
int xmlout;
#endif
int htmlout;
#ifdef LIBXML_PUSH_ENABLED
int push;
#endif /* LIBXML_PUSH_ENABLED */
#if HAVE_DECL_MMAP
int memory;
char *memoryData;
size_t memorySize;
#endif
int testIO;
#ifdef LIBXML_XINCLUDE_ENABLED
int xinclude;
#endif
xmllintReturnCode progresult;
int quiet;
int timing;
int generate;
int dropdtd;
#ifdef LIBXML_C14N_ENABLED
int canonical;
int canonical_11;
int exc_canonical;
#endif
#ifdef LIBXML_READER_ENABLED
int stream;
int walker;
#ifdef LIBXML_PATTERN_ENABLED
const char *pattern;
xmlPatternPtr patternc;
xmlStreamCtxtPtr patstream;
#endif
#endif /* LIBXML_READER_ENABLED */
#ifdef LIBXML_XPATH_ENABLED
const char *xpathquery;
#endif
#ifdef LIBXML_CATALOG_ENABLED
int catalogs;
int nocatalogs;
#endif
int options;
unsigned maxAmpl;
xmlChar *paths[MAX_PATHS + 1];
int nbpaths;
int load_trace;
char *htmlBuf;
int htmlBufLen;
2025-02-25 20:09:36 +01:00
xmlTime begin;
xmlTime end;
} xmllintState;
static int xmllintMaxmem;
static int xmllintMaxmemReached;
static int xmllintOom;
/************************************************************************
* *
* Entity loading control and customization. *
* *
************************************************************************/
static void
parsePath(xmllintState *lint, const xmlChar *path) {
const xmlChar *cur;
if (path == NULL)
return;
while (*path != 0) {
if (lint->nbpaths >= MAX_PATHS) {
fprintf(lint->errStream, "MAX_PATHS reached: too many paths\n");
lint->progresult = XMLLINT_ERR_UNCLASS;
return;
}
cur = path;
while ((*cur == ' ') || (*cur == PATH_SEPARATOR))
cur++;
path = cur;
while ((*cur != 0) && (*cur != ' ') && (*cur != PATH_SEPARATOR))
cur++;
if (cur != path) {
lint->paths[lint->nbpaths] = xmlStrndup(path, cur - path);
if (lint->paths[lint->nbpaths] != NULL)
lint->nbpaths++;
path = cur;
}
}
}
static xmlParserErrors
xmllintResourceLoader(void *ctxt, const char *URL,
2025-03-13 23:20:16 +01:00
const char *ID, xmlResourceType type,
xmlParserInputFlags flags, xmlParserInputPtr *out) {
xmllintState *lint = ctxt;
xmlParserErrors code;
int i;
const char *lastsegment = URL;
const char *iter = URL;
if ((lint->nbpaths > 0) && (iter != NULL)) {
while (*iter != 0) {
if (*iter == '/')
lastsegment = iter + 1;
iter++;
}
}
if (lint->defaultResourceLoader != NULL)
code = lint->defaultResourceLoader(NULL, URL, ID, type, flags, out);
2024-06-11 18:14:43 +02:00
else
code = xmlNewInputFromUrl(URL, flags, out);
2024-06-11 18:14:43 +02:00
if (code != XML_IO_ENOENT) {
if ((lint->load_trace) && (code == XML_ERR_OK)) {
fprintf(lint->errStream, "Loaded URL=\"%s\" ID=\"%s\"\n",
2024-06-11 18:14:43 +02:00
URL, ID ? ID : "(null)");
}
return(code);
}
for (i = 0; i < lint->nbpaths; i++) {
xmlChar *newURL;
newURL = xmlStrdup((const xmlChar *) lint->paths[i]);
newURL = xmlStrcat(newURL, (const xmlChar *) "/");
newURL = xmlStrcat(newURL, (const xmlChar *) lastsegment);
if (newURL != NULL) {
if (lint->defaultResourceLoader != NULL)
code = lint->defaultResourceLoader(NULL, (const char *) newURL,
ID, type, flags, out);
2024-06-11 18:14:43 +02:00
else
code = xmlNewInputFromUrl((const char *) newURL, flags, out);
2024-06-11 18:14:43 +02:00
if (code != XML_IO_ENOENT) {
if ((lint->load_trace) && (code == XML_ERR_OK)) {
fprintf(lint->errStream, "Loaded URL=\"%s\" ID=\"%s\"\n",
2024-06-11 18:14:43 +02:00
newURL, ID ? ID : "(null)");
}
xmlFree(newURL);
return(code);
}
xmlFree(newURL);
}
}
2024-06-11 18:14:43 +02:00
return(XML_IO_ENOENT);
}
2024-05-13 12:18:08 +02:00
/************************************************************************
* *
* Core parsing functions *
* *
************************************************************************/
static int
myRead(void *f, char *buf, int len) {
return(fread(buf, 1, len, (FILE *) f));
}
static int
myClose(void *context) {
FILE *f = (FILE *) context;
if (f == stdin)
return(0);
return(fclose(f));
}
static xmlDocPtr
parseXml(xmllintState *lint, const char *filename) {
xmlParserCtxtPtr ctxt = lint->ctxt;
xmlDocPtr doc;
#ifdef LIBXML_PUSH_ENABLED
if (lint->push) {
FILE *f;
int res;
char chars[4096];
if ((filename[0] == '-') && (filename[1] == 0)) {
f = stdin;
} else {
f = fopen(filename, "rb");
if (f == NULL) {
fprintf(lint->errStream, "Can't open %s\n", filename);
lint->progresult = XMLLINT_ERR_RDFILE;
return(NULL);
}
}
while ((res = fread(chars, 1, 4096, f)) > 0) {
xmlParseChunk(ctxt, chars, res, 0);
}
xmlParseChunk(ctxt, chars, 0, 1);
doc = ctxt->myDoc;
ctxt->myDoc = NULL;
if (f != stdin)
fclose(f);
/*
* The push parser leaves non-wellformed documents
* in ctxt->myDoc.
*/
if (!ctxt->wellFormed) {
xmlFreeDoc(doc);
doc = NULL;
}
return(doc);
}
#endif /* LIBXML_PUSH_ENABLED */
#if HAVE_DECL_MMAP
if (lint->memory) {
xmlParserInputPtr input;
input = xmlNewInputFromMemory(filename,
lint->memoryData, lint->memorySize,
XML_INPUT_BUF_STATIC);
if (input == NULL) {
lint->progresult = XMLLINT_ERR_MEM;
return(NULL);
}
doc = xmlCtxtParseDocument(ctxt, input);
return(doc);
}
#endif
if (lint->testIO) {
FILE *f;
if ((filename[0] == '-') && (filename[1] == 0)) {
f = stdin;
} else {
f = fopen(filename, "rb");
if (f == NULL) {
fprintf(lint->errStream, "Can't open %s\n", filename);
lint->progresult = XMLLINT_ERR_RDFILE;
return(NULL);
}
}
doc = xmlCtxtReadIO(ctxt, myRead, myClose, f, filename, NULL,
lint->options);
} else {
if (strcmp(filename, "-") == 0)
doc = xmlCtxtReadFd(ctxt, STDIN_FILENO, "-", NULL,
lint->options | XML_PARSE_UNZIP);
else
doc = xmlCtxtReadFile(ctxt, filename, NULL,
lint->options | XML_PARSE_UNZIP);
}
return(doc);
}
#ifdef LIBXML_HTML_ENABLED
static xmlDocPtr
parseHtml(xmllintState *lint, const char *filename) {
xmlParserCtxtPtr ctxt = lint->ctxt;
xmlDocPtr doc;
#ifdef LIBXML_PUSH_ENABLED
if (lint->push) {
FILE *f;
int res;
char chars[4096];
if ((filename[0] == '-') && (filename[1] == 0)) {
f = stdin;
} else {
f = fopen(filename, "rb");
if (f == NULL) {
fprintf(lint->errStream, "Can't open %s\n", filename);
lint->progresult = XMLLINT_ERR_RDFILE;
return(NULL);
}
}
while ((res = fread(chars, 1, 4096, f)) > 0) {
htmlParseChunk(ctxt, chars, res, 0);
}
htmlParseChunk(ctxt, chars, 0, 1);
doc = ctxt->myDoc;
ctxt->myDoc = NULL;
if (f != stdin)
fclose(f);
return(doc);
}
#endif /* LIBXML_PUSH_ENABLED */
#if HAVE_DECL_MMAP
if (lint->memory) {
xmlParserInputPtr input;
input = xmlNewInputFromMemory(filename,
lint->memoryData, lint->memorySize,
XML_INPUT_BUF_STATIC);
if (input == NULL) {
lint->progresult = XMLLINT_ERR_MEM;
return(NULL);
}
doc = htmlCtxtParseDocument(ctxt, input);
return(doc);
}
#endif
if (strcmp(filename, "-") == 0)
doc = htmlCtxtReadFd(ctxt, STDIN_FILENO, "-", NULL,
lint->options);
else
doc = htmlCtxtReadFile(ctxt, filename, NULL, lint->options);
return(doc);
}
#endif /* LIBXML_HTML_ENABLED */
/************************************************************************
* *
* Memory allocation consumption debugging *
* *
************************************************************************/
#define XMLLINT_ABORT_ON_FAILURE 0
static void
myFreeFunc(void *mem) {
xmlMemFree(mem);
}
static void *
myMallocFunc(size_t size) {
void *ret;
if (xmlMemUsed() + size > (size_t) xmllintMaxmem) {
#if XMLLINT_ABORT_ON_FAILURE
abort();
#endif
xmllintMaxmemReached = 1;
xmllintOom = 1;
return(NULL);
}
ret = xmlMemMalloc(size);
if (ret == NULL)
xmllintOom = 1;
return(ret);
}
static void *
myReallocFunc(void *mem, size_t size) {
void *ret;
size_t oldsize = xmlMemSize(mem);
if (xmlMemUsed() + size - oldsize > (size_t) xmllintMaxmem) {
#if XMLLINT_ABORT_ON_FAILURE
abort();
#endif
xmllintMaxmemReached = 1;
xmllintOom = 1;
return(NULL);
}
ret = xmlMemRealloc(mem, size);
if (ret == NULL)
xmllintOom = 1;
return(ret);
}
static char *
myStrdupFunc(const char *str) {
size_t size;
char *ret;
if (str == NULL)
return(NULL);
size = strlen(str) + 1;
if (xmlMemUsed() + size > (size_t) xmllintMaxmem) {
#if XMLLINT_ABORT_ON_FAILURE
abort();
#endif
xmllintMaxmemReached = 1;
xmllintOom = 1;
return(NULL);
}
ret = xmlMemMalloc(size);
if (ret == NULL) {
xmllintOom = 1;
return(NULL);
}
memcpy(ret, str, size);
return(ret);
}
/************************************************************************
* *
* Internal timing routines to remove the necessity to have *
* unix-specific function calls. *
* *
************************************************************************/
static void
getTime(xmlTime *time) {
#ifdef _WIN32
struct __timeb64 timebuffer;
_ftime64(&timebuffer);
time->sec = timebuffer.time;
time->usec = timebuffer.millitm * 1000;
#else /* _WIN32 */
struct timeval tv;
gettimeofday(&tv, NULL);
time->sec = tv.tv_sec;
time->usec = tv.tv_usec;
#endif /* _WIN32 */
}
/*
* startTimer: call where you want to start timing
*/
static void
startTimer(xmllintState *lint)
{
getTime(&lint->begin);
}
/*
* endTimer: call where you want to stop timing and to print out a
* message about the timing performed; format is a printf
* type argument
*/
static void LIBXML_ATTR_FORMAT(2,3)
endTimer(xmllintState *lint, const char *fmt, ...)
{
xmlSeconds msec;
va_list ap;
getTime(&lint->end);
msec = lint->end.sec - lint->begin.sec;
msec *= 1000;
msec += (lint->end.usec - lint->begin.usec) / 1000;
va_start(ap, fmt);
vfprintf(lint->errStream, fmt, ap);
va_end(ap);
fprintf(lint->errStream, " took %ld ms\n", (long) msec);
}
/************************************************************************
* *
2019-09-30 17:04:54 +02:00
* HTML output *
* *
************************************************************************/
static void
xmlHTMLEncodeSend(xmllintState *lint) {
char *result;
/*
* xmlEncodeEntitiesReentrant assumes valid UTF-8, but the buffer might
* end with a truncated UTF-8 sequence. This is a hack to at least avoid
* an out-of-bounds read.
*/
memset(&lint->htmlBuf[HTML_BUF_SIZE - 4], 0, 4);
result = (char *) xmlEncodeEntitiesReentrant(NULL, BAD_CAST lint->htmlBuf);
if (result) {
fprintf(lint->errStream, "%s", result);
xmlFree(result);
}
lint->htmlBufLen = 0;
2024-06-10 23:05:40 +02:00
}
static void
xmlHTMLBufCat(void *data, const char *fmt, ...) {
xmllintState *lint = data;
2024-06-10 23:05:40 +02:00
va_list ap;
int res;
2024-06-10 23:05:40 +02:00
va_start(ap, fmt);
res = vsnprintf(&lint->htmlBuf[lint->htmlBufLen],
HTML_BUF_SIZE - lint->htmlBufLen, fmt, ap);
2024-06-10 23:05:40 +02:00
va_end(ap);
if (res > 0) {
if (res > HTML_BUF_SIZE - lint->htmlBufLen - 1)
lint->htmlBufLen = HTML_BUF_SIZE - 1;
2024-06-10 23:05:40 +02:00
else
lint->htmlBufLen += res;
}
}
/**
* xmlHTMLError:
* @ctx: an XML parser context
* @msg: the message to display/transmit
* @...: extra parameters for the message display
*
* Display and format an error messages, gives file, line, position and
* extra parameters.
*/
static void
xmlHTMLError(void *vctxt, const xmlError *error)
{
xmlParserCtxtPtr ctxt = vctxt;
xmllintState *lint = ctxt->_private;
2024-06-10 23:05:40 +02:00
xmlParserInputPtr input;
xmlGenericErrorFunc oldError;
void *oldErrorCtxt;
2024-06-10 23:05:40 +02:00
input = ctxt->input;
if ((input != NULL) && (input->filename == NULL) && (ctxt->inputNr > 1)) {
input = ctxt->inputTab[ctxt->inputNr - 2];
}
2024-06-10 23:05:40 +02:00
oldError = xmlGenericError;
oldErrorCtxt = xmlGenericErrorContext;
xmlSetGenericErrorFunc(lint, xmlHTMLBufCat);
2024-06-10 23:05:40 +02:00
fprintf(lint->errStream, "<p>");
2024-06-10 23:05:40 +02:00
xmlParserPrintFileInfo(input);
xmlHTMLEncodeSend(lint);
2024-06-10 23:05:40 +02:00
fprintf(lint->errStream, "<b>%s%s</b>: ",
(error->domain == XML_FROM_VALID) ||
(error->domain == XML_FROM_DTD) ? "validity " : "",
error->level == XML_ERR_WARNING ? "warning" : "error");
2024-06-10 23:05:40 +02:00
snprintf(lint->htmlBuf, HTML_BUF_SIZE, "%s", error->message);
xmlHTMLEncodeSend(lint);
2024-06-10 23:05:40 +02:00
fprintf(lint->errStream, "</p>\n");
2024-06-10 23:05:40 +02:00
if (input != NULL) {
fprintf(lint->errStream, "<pre>\n");
2024-06-10 23:05:40 +02:00
xmlParserPrintFileContext(input);
xmlHTMLEncodeSend(lint);
2024-06-10 23:05:40 +02:00
fprintf(lint->errStream, "</pre>");
2024-06-10 23:05:40 +02:00
}
xmlSetGenericErrorFunc(oldErrorCtxt, oldError);
}
/************************************************************************
* *
* SAX based tests *
* *
************************************************************************/
/*
* empty SAX block
*/
static const xmlSAXHandler emptySAXHandler = {
NULL, /* internalSubset */
NULL, /* isStandalone */
NULL, /* hasInternalSubset */
NULL, /* hasExternalSubset */
NULL, /* resolveEntity */
NULL, /* getEntity */
NULL, /* entityDecl */
NULL, /* notationDecl */
NULL, /* attributeDecl */
NULL, /* elementDecl */
NULL, /* unparsedEntityDecl */
NULL, /* setDocumentLocator */
NULL, /* startDocument */
NULL, /* endDocument */
NULL, /* startElement */
NULL, /* endElement */
NULL, /* reference */
NULL, /* characters */
NULL, /* ignorableWhitespace */
NULL, /* processingInstruction */
NULL, /* comment */
NULL, /* xmlParserWarning */
NULL, /* xmlParserError */
NULL, /* xmlParserError */
NULL, /* getParameterEntity */
NULL, /* cdataBlock; */
NULL, /* externalSubset; */
XML_SAX2_MAGIC,
NULL,
NULL, /* startElementNs */
NULL, /* endElementNs */
NULL /* xmlStructuredErrorFunc */
};
/**
* isStandaloneDebug:
* @ctxt: An XML parser context
*
* Is this document tagged standalone ?
*
* Returns 1 if true
*/
static int
isStandaloneDebug(void *ctx)
{
xmllintState *lint = ctx;
lint->callbacks++;
if (lint->noout)
return(0);
fprintf(stdout, "SAX.isStandalone()\n");
return(0);
}
/**
* hasInternalSubsetDebug:
* @ctxt: An XML parser context
*
* Does this document has an internal subset
*
* Returns 1 if true
*/
static int
hasInternalSubsetDebug(void *ctx)
{
xmllintState *lint = ctx;
lint->callbacks++;
if (lint->noout)
return(0);
fprintf(stdout, "SAX.hasInternalSubset()\n");
return(0);
}
/**
* hasExternalSubsetDebug:
* @ctxt: An XML parser context
*
* Does this document has an external subset
*
* Returns 1 if true
*/
static int
hasExternalSubsetDebug(void *ctx)
{
xmllintState *lint = ctx;
lint->callbacks++;
if (lint->noout)
return(0);
fprintf(stdout, "SAX.hasExternalSubset()\n");
return(0);
}
/**
* internalSubsetDebug:
* @ctxt: An XML parser context
*
* Does this document has an internal subset
*/
static void
internalSubsetDebug(void *ctx, const xmlChar *name,
const xmlChar *ExternalID, const xmlChar *SystemID)
{
xmllintState *lint = ctx;
lint->callbacks++;
if (lint->noout)
return;
fprintf(stdout, "SAX.internalSubset(%s,", name);
if (ExternalID == NULL)
fprintf(stdout, " ,");
else
fprintf(stdout, " %s,", ExternalID);
if (SystemID == NULL)
fprintf(stdout, " )\n");
else
fprintf(stdout, " %s)\n", SystemID);
}
/**
* externalSubsetDebug:
* @ctxt: An XML parser context
*
* Does this document has an external subset
*/
static void
externalSubsetDebug(void *ctx, const xmlChar *name,
const xmlChar *ExternalID, const xmlChar *SystemID)
{
xmllintState *lint = ctx;
lint->callbacks++;
if (lint->noout)
return;
fprintf(stdout, "SAX.externalSubset(%s,", name);
if (ExternalID == NULL)
fprintf(stdout, " ,");
else
fprintf(stdout, " %s,", ExternalID);
if (SystemID == NULL)
fprintf(stdout, " )\n");
else
fprintf(stdout, " %s)\n", SystemID);
}
/**
* resolveEntityDebug:
* @ctxt: An XML parser context
* @publicId: The public ID of the entity
* @systemId: The system ID of the entity
*
* Special entity resolver, better left to the parser, it has
* more context than the application layer.
* The default behaviour is to NOT resolve the entities, in that case
* the ENTITY_REF nodes are built in the structure (and the parameter
* values).
*
* Returns the xmlParserInputPtr if inlined or NULL for DOM behaviour.
*/
static xmlParserInputPtr
resolveEntityDebug(void *ctx, const xmlChar *publicId, const xmlChar *systemId)
{
xmllintState *lint = ctx;
lint->callbacks++;
if (lint->noout)
return(NULL);
/* xmlParserCtxtPtr ctxt = (xmlParserCtxtPtr) ctx; */
fprintf(stdout, "SAX.resolveEntity(");
if (publicId != NULL)
fprintf(stdout, "%s", (char *)publicId);
else
fprintf(stdout, " ");
if (systemId != NULL)
fprintf(stdout, ", %s)\n", (char *)systemId);
else
fprintf(stdout, ", )\n");
return(NULL);
}
/**
* getEntityDebug:
* @ctxt: An XML parser context
* @name: The entity name
*
* Get an entity by name
*
* Returns the xmlParserInputPtr if inlined or NULL for DOM behaviour.
*/
static xmlEntityPtr
getEntityDebug(void *ctx, const xmlChar *name)
{
xmllintState *lint = ctx;
lint->callbacks++;
if (lint->noout)
return(NULL);
fprintf(stdout, "SAX.getEntity(%s)\n", name);
return(NULL);
}
/**
* getParameterEntityDebug:
* @ctxt: An XML parser context
* @name: The entity name
*
* Get a parameter entity by name
*
* Returns the xmlParserInputPtr
*/
static xmlEntityPtr
getParameterEntityDebug(void *ctx, const xmlChar *name)
{
xmllintState *lint = ctx;
lint->callbacks++;
if (lint->noout)
return(NULL);
fprintf(stdout, "SAX.getParameterEntity(%s)\n", name);
return(NULL);
}
/**
* entityDeclDebug:
* @ctxt: An XML parser context
* @name: the entity name
* @type: the entity type
* @publicId: The public ID of the entity
* @systemId: The system ID of the entity
* @content: the entity value (without processing).
*
* An entity definition has been parsed
*/
static void
entityDeclDebug(void *ctx, const xmlChar *name, int type,
const xmlChar *publicId, const xmlChar *systemId, xmlChar *content)
{
xmllintState *lint = ctx;
const xmlChar *nullstr = BAD_CAST "(null)";
/* not all libraries handle printing null pointers nicely */
if (publicId == NULL)
publicId = nullstr;
if (systemId == NULL)
systemId = nullstr;
if (content == NULL)
content = (xmlChar *)nullstr;
lint->callbacks++;
if (lint->noout)
return;
fprintf(stdout, "SAX.entityDecl(%s, %d, %s, %s, %s)\n",
name, type, publicId, systemId, content);
}
/**
* attributeDeclDebug:
* @ctxt: An XML parser context
* @name: the attribute name
* @type: the attribute type
*
* An attribute definition has been parsed
*/
static void
attributeDeclDebug(void *ctx, const xmlChar * elem,
const xmlChar * name, int type, int def,
const xmlChar * defaultValue, xmlEnumerationPtr tree)
{
xmllintState *lint = ctx;
lint->callbacks++;
if (lint->noout)
return;
if (defaultValue == NULL)
fprintf(stdout, "SAX.attributeDecl(%s, %s, %d, %d, NULL, ...)\n",
elem, name, type, def);
else
fprintf(stdout, "SAX.attributeDecl(%s, %s, %d, %d, %s, ...)\n",
elem, name, type, def, defaultValue);
xmlFreeEnumeration(tree);
}
/**
* elementDeclDebug:
* @ctxt: An XML parser context
* @name: the element name
* @type: the element type
* @content: the element value (without processing).
*
* An element definition has been parsed
*/
static void
elementDeclDebug(void *ctx, const xmlChar *name, int type,
xmlElementContentPtr content ATTRIBUTE_UNUSED)
{
xmllintState *lint = ctx;
lint->callbacks++;
if (lint->noout)
return;
fprintf(stdout, "SAX.elementDecl(%s, %d, ...)\n",
name, type);
}
/**
* notationDeclDebug:
* @ctxt: An XML parser context
* @name: The name of the notation
* @publicId: The public ID of the entity
* @systemId: The system ID of the entity
*
* What to do when a notation declaration has been parsed.
*/
static void
notationDeclDebug(void *ctx, const xmlChar *name,
const xmlChar *publicId, const xmlChar *systemId)
{
xmllintState *lint = ctx;
lint->callbacks++;
if (lint->noout)
return;
fprintf(stdout, "SAX.notationDecl(%s, %s, %s)\n",
(char *) name, (char *) publicId, (char *) systemId);
}
/**
* unparsedEntityDeclDebug:
* @ctxt: An XML parser context
* @name: The name of the entity
* @publicId: The public ID of the entity
* @systemId: The system ID of the entity
* @notationName: the name of the notation
*
* What to do when an unparsed entity declaration is parsed
*/
static void
unparsedEntityDeclDebug(void *ctx, const xmlChar *name,
const xmlChar *publicId, const xmlChar *systemId,
const xmlChar *notationName)
{
xmllintState *lint = ctx;
const xmlChar *nullstr = BAD_CAST "(null)";
if (publicId == NULL)
publicId = nullstr;
if (systemId == NULL)
systemId = nullstr;
if (notationName == NULL)
notationName = nullstr;
lint->callbacks++;
if (lint->noout)
return;
fprintf(stdout, "SAX.unparsedEntityDecl(%s, %s, %s, %s)\n",
(char *) name, (char *) publicId, (char *) systemId,
(char *) notationName);
}
/**
* setDocumentLocatorDebug:
* @ctxt: An XML parser context
* @loc: A SAX Locator
*
* Receive the document locator at startup, actually xmlDefaultSAXLocator
* Everything is available on the context, so this is useless in our case.
*/
static void
setDocumentLocatorDebug(void *ctx, xmlSAXLocatorPtr loc ATTRIBUTE_UNUSED)
{
xmllintState *lint = ctx;
lint->callbacks++;
if (lint->noout)
return;
fprintf(stdout, "SAX.setDocumentLocator()\n");
}
/**
* startDocumentDebug:
* @ctxt: An XML parser context
*
* called when the document start being processed.
*/
static void
startDocumentDebug(void *ctx)
{
xmllintState *lint = ctx;
lint->callbacks++;
if (lint->noout)
return;
fprintf(stdout, "SAX.startDocument()\n");
}
/**
* endDocumentDebug:
* @ctxt: An XML parser context
*
* called when the document end has been detected.
*/
static void
endDocumentDebug(void *ctx)
{
xmllintState *lint = ctx;
lint->callbacks++;
if (lint->noout)
return;
fprintf(stdout, "SAX.endDocument()\n");
}
#ifdef LIBXML_SAX1_ENABLED
/**
* startElementDebug:
* @ctxt: An XML parser context
* @name: The element name
*
* called when an opening tag has been processed.
*/
static void
startElementDebug(void *ctx, const xmlChar *name, const xmlChar **atts)
{
xmllintState *lint = ctx;
int i;
lint->callbacks++;
if (lint->noout)
return;
fprintf(stdout, "SAX.startElement(%s", (char *) name);
if (atts != NULL) {
for (i = 0;(atts[i] != NULL);i++) {
fprintf(stdout, ", %s='", atts[i++]);
if (atts[i] != NULL)
fprintf(stdout, "%s'", atts[i]);
}
}
fprintf(stdout, ")\n");
}
/**
* endElementDebug:
* @ctxt: An XML parser context
* @name: The element name
*
* called when the end of an element has been detected.
*/
static void
endElementDebug(void *ctx, const xmlChar *name)
{
xmllintState *lint = ctx;
lint->callbacks++;
if (lint->noout)
return;
fprintf(stdout, "SAX.endElement(%s)\n", (char *) name);
}
#endif /* LIBXML_SAX1_ENABLED */
/**
* charactersDebug:
* @ctxt: An XML parser context
* @ch: a xmlChar string
* @len: the number of xmlChar
*
* receiving some chars from the parser.
* Question: how much at a time ???
*/
static void
charactersDebug(void *ctx, const xmlChar *ch, int len)
{
xmllintState *lint = ctx;
char out[40];
int i;
lint->callbacks++;
if (lint->noout)
return;
for (i = 0;(i<len) && (i < 30);i++)
out[i] = (char) ch[i];
out[i] = 0;
fprintf(stdout, "SAX.characters(%s, %d)\n", out, len);
}
/**
* referenceDebug:
* @ctxt: An XML parser context
* @name: The entity name
*
* called when an entity reference is detected.
*/
static void
referenceDebug(void *ctx, const xmlChar *name)
{
xmllintState *lint = ctx;
lint->callbacks++;
if (lint->noout)
return;
fprintf(stdout, "SAX.reference(%s)\n", name);
}
/**
* ignorableWhitespaceDebug:
* @ctxt: An XML parser context
* @ch: a xmlChar string
* @start: the first char in the string
* @len: the number of xmlChar
*
* receiving some ignorable whitespaces from the parser.
* Question: how much at a time ???
*/
static void
ignorableWhitespaceDebug(void *ctx, const xmlChar *ch, int len)
{
xmllintState *lint = ctx;
char out[40];
int i;
lint->callbacks++;
if (lint->noout)
return;
for (i = 0;(i<len) && (i < 30);i++)
out[i] = ch[i];
out[i] = 0;
fprintf(stdout, "SAX.ignorableWhitespace(%s, %d)\n", out, len);
}
/**
* processingInstructionDebug:
* @ctxt: An XML parser context
* @target: the target name
* @data: the PI data's
* @len: the number of xmlChar
*
* A processing instruction has been parsed.
*/
static void
processingInstructionDebug(void *ctx, const xmlChar *target,
const xmlChar *data)
{
xmllintState *lint = ctx;
lint->callbacks++;
if (lint->noout)
return;
if (data != NULL)
fprintf(stdout, "SAX.processingInstruction(%s, %s)\n",
(char *) target, (char *) data);
else
fprintf(stdout, "SAX.processingInstruction(%s, NULL)\n",
(char *) target);
}
/**
* cdataBlockDebug:
* @ctx: the user data (XML parser context)
* @value: The pcdata content
* @len: the block length
*
* called when a pcdata block has been parsed
*/
static void
cdataBlockDebug(void *ctx, const xmlChar *value, int len)
{
xmllintState *lint = ctx;
lint->callbacks++;
if (lint->noout)
return;
fprintf(stdout, "SAX.pcdata(%.20s, %d)\n",
(char *) value, len);
}
/**
* commentDebug:
* @ctxt: An XML parser context
* @value: the comment content
*
* A comment has been parsed.
*/
static void
commentDebug(void *ctx, const xmlChar *value)
{
xmllintState *lint = ctx;
lint->callbacks++;
if (lint->noout)
return;
fprintf(stdout, "SAX.comment(%s)\n", value);
}
/**
* warningDebug:
* @ctxt: An XML parser context
* @msg: the message to display/transmit
* @...: extra parameters for the message display
*
* Display and format a warning messages, gives file, line, position and
* extra parameters.
*/
2022-12-08 02:43:17 +01:00
static void LIBXML_ATTR_FORMAT(2,3)
warningDebug(void *ctx, const char *msg, ...)
{
xmllintState *lint = ctx;
va_list args;
lint->callbacks++;
if (lint->noout)
return;
va_start(args, msg);
fprintf(stdout, "SAX.warning: ");
vfprintf(stdout, msg, args);
va_end(args);
}
/**
* errorDebug:
* @ctxt: An XML parser context
* @msg: the message to display/transmit
* @...: extra parameters for the message display
*
* Display and format a error messages, gives file, line, position and
* extra parameters.
*/
2022-12-08 02:43:17 +01:00
static void LIBXML_ATTR_FORMAT(2,3)
errorDebug(void *ctx, const char *msg, ...)
{
xmllintState *lint = ctx;
va_list args;
lint->callbacks++;
if (lint->noout)
return;
va_start(args, msg);
fprintf(stdout, "SAX.error: ");
vfprintf(stdout, msg, args);
va_end(args);
}
/**
* fatalErrorDebug:
* @ctxt: An XML parser context
* @msg: the message to display/transmit
* @...: extra parameters for the message display
*
* Display and format a fatalError messages, gives file, line, position and
* extra parameters.
*/
2022-12-08 02:43:17 +01:00
static void LIBXML_ATTR_FORMAT(2,3)
fatalErrorDebug(void *ctx, const char *msg, ...)
{
xmllintState *lint = ctx;
va_list args;
lint->callbacks++;
if (lint->noout)
return;
va_start(args, msg);
fprintf(stdout, "SAX.fatalError: ");
vfprintf(stdout, msg, args);
va_end(args);
}
#ifdef LIBXML_SAX1_ENABLED
static const xmlSAXHandler debugSAXHandler = {
internalSubsetDebug,
isStandaloneDebug,
hasInternalSubsetDebug,
hasExternalSubsetDebug,
resolveEntityDebug,
getEntityDebug,
entityDeclDebug,
notationDeclDebug,
attributeDeclDebug,
elementDeclDebug,
unparsedEntityDeclDebug,
setDocumentLocatorDebug,
startDocumentDebug,
endDocumentDebug,
startElementDebug,
endElementDebug,
referenceDebug,
charactersDebug,
ignorableWhitespaceDebug,
processingInstructionDebug,
commentDebug,
warningDebug,
errorDebug,
fatalErrorDebug,
getParameterEntityDebug,
cdataBlockDebug,
externalSubsetDebug,
1,
NULL,
NULL,
NULL,
NULL
};
#endif
/*
* SAX2 specific callbacks
*/
/**
* startElementNsDebug:
* @ctxt: An XML parser context
* @name: The element name
*
* called when an opening tag has been processed.
*/
static void
startElementNsDebug(void *ctx,
const xmlChar *localname,
const xmlChar *prefix,
const xmlChar *URI,
int nb_namespaces,
const xmlChar **namespaces,
int nb_attributes,
int nb_defaulted,
const xmlChar **attributes)
{
xmllintState *lint = ctx;
int i;
lint->callbacks++;
if (lint->noout)
return;
fprintf(stdout, "SAX.startElementNs(%s", (char *) localname);
if (prefix == NULL)
fprintf(stdout, ", NULL");
else
fprintf(stdout, ", %s", (char *) prefix);
if (URI == NULL)
fprintf(stdout, ", NULL");
else
fprintf(stdout, ", '%s'", (char *) URI);
fprintf(stdout, ", %d", nb_namespaces);
if (namespaces != NULL) {
for (i = 0;i < nb_namespaces * 2;i++) {
fprintf(stdout, ", xmlns");
if (namespaces[i] != NULL)
fprintf(stdout, ":%s", namespaces[i]);
i++;
fprintf(stdout, "='%s'", namespaces[i]);
}
}
fprintf(stdout, ", %d, %d", nb_attributes, nb_defaulted);
if (attributes != NULL) {
for (i = 0;i < nb_attributes * 5;i += 5) {
if (attributes[i + 1] != NULL)
fprintf(stdout, ", %s:%s='", attributes[i + 1], attributes[i]);
else
fprintf(stdout, ", %s='", attributes[i]);
fprintf(stdout, "%.4s...', %d", attributes[i + 3],
(int)(attributes[i + 4] - attributes[i + 3]));
}
}
fprintf(stdout, ")\n");
}
/**
* endElementDebug:
* @ctxt: An XML parser context
* @name: The element name
*
* called when the end of an element has been detected.
*/
static void
endElementNsDebug(void *ctx,
const xmlChar *localname,
const xmlChar *prefix,
const xmlChar *URI)
{
xmllintState *lint = ctx;
lint->callbacks++;
if (lint->noout)
return;
fprintf(stdout, "SAX.endElementNs(%s", (char *) localname);
if (prefix == NULL)
fprintf(stdout, ", NULL");
else
fprintf(stdout, ", %s", (char *) prefix);
if (URI == NULL)
fprintf(stdout, ", NULL)\n");
else
fprintf(stdout, ", '%s')\n", (char *) URI);
}
static const xmlSAXHandler debugSAX2Handler = {
internalSubsetDebug,
isStandaloneDebug,
hasInternalSubsetDebug,
hasExternalSubsetDebug,
resolveEntityDebug,
getEntityDebug,
entityDeclDebug,
notationDeclDebug,
attributeDeclDebug,
elementDeclDebug,
unparsedEntityDeclDebug,
setDocumentLocatorDebug,
startDocumentDebug,
endDocumentDebug,
NULL,
NULL,
referenceDebug,
charactersDebug,
ignorableWhitespaceDebug,
processingInstructionDebug,
commentDebug,
warningDebug,
errorDebug,
fatalErrorDebug,
getParameterEntityDebug,
cdataBlockDebug,
externalSubsetDebug,
XML_SAX2_MAGIC,
NULL,
startElementNsDebug,
endElementNsDebug,
NULL
};
static void
testSAX(xmllintState *lint, const char *filename) {
lint->callbacks = 0;
#ifdef LIBXML_SCHEMAS_ENABLED
if (lint->wxschemas != NULL) {
int ret;
xmlSchemaValidCtxtPtr vctxt;
xmlParserInputBufferPtr buf;
if (strcmp(filename, "-") == 0)
buf = xmlParserInputBufferCreateFd(STDIN_FILENO,
XML_CHAR_ENCODING_NONE);
else
buf = xmlParserInputBufferCreateFilename(filename,
XML_CHAR_ENCODING_NONE);
if (buf == NULL)
return;
vctxt = xmlSchemaNewValidCtxt(lint->wxschemas);
if (vctxt == NULL) {
lint->progresult = XMLLINT_ERR_MEM;
xmlFreeParserInputBuffer(buf);
return;
}
xmlSchemaValidateSetFilename(vctxt, filename);
ret = xmlSchemaValidateStream(vctxt, buf, 0, lint->ctxt->sax, lint);
if (lint->repeat == 1) {
if (ret == 0) {
if (!lint->quiet) {
fprintf(lint->errStream, "%s validates\n", filename);
}
} else if (ret > 0) {
fprintf(lint->errStream, "%s fails to validate\n", filename);
lint->progresult = XMLLINT_ERR_VALID;
} else {
fprintf(lint->errStream, "%s validation generated an internal error\n",
filename);
lint->progresult = XMLLINT_ERR_VALID;
}
}
xmlSchemaFreeValidCtxt(vctxt);
} else
2024-09-27 22:54:14 +02:00
#endif
#ifdef LIBXML_HTML_ENABLED
if (lint->html) {
parseHtml(lint, filename);
2024-09-27 22:54:14 +02:00
} else
#endif
{
parseXml(lint, filename);
}
}
/************************************************************************
* *
* Stream Test processing *
* *
************************************************************************/
#ifdef LIBXML_READER_ENABLED
static void processNode(xmllintState *lint, xmlTextReaderPtr reader) {
const xmlChar *name, *value;
int type, empty;
type = xmlTextReaderNodeType(reader);
empty = xmlTextReaderIsEmptyElement(reader);
if (lint->debug) {
name = xmlTextReaderConstName(reader);
if (name == NULL)
name = BAD_CAST "--";
value = xmlTextReaderConstValue(reader);
printf("%d %d %s %d %d",
xmlTextReaderDepth(reader),
type,
name,
empty,
xmlTextReaderHasValue(reader));
if (value == NULL)
printf("\n");
else {
printf(" %s\n", value);
}
}
#ifdef LIBXML_PATTERN_ENABLED
if (lint->patternc) {
xmlChar *path = NULL;
int match = -1;
if (type == XML_READER_TYPE_ELEMENT) {
/* do the check only on element start */
match = xmlPatternMatch(lint->patternc,
xmlTextReaderCurrentNode(reader));
if (match) {
path = xmlGetNodePath(xmlTextReaderCurrentNode(reader));
printf("Node %s matches pattern %s\n", path, lint->pattern);
}
}
if (lint->patstream != NULL) {
int ret;
if (type == XML_READER_TYPE_ELEMENT) {
ret = xmlStreamPush(lint->patstream,
xmlTextReaderConstLocalName(reader),
xmlTextReaderConstNamespaceUri(reader));
if (ret < 0) {
fprintf(lint->errStream, "xmlStreamPush() failure\n");
xmlFreeStreamCtxt(lint->patstream);
lint->patstream = NULL;
} else if (ret != match) {
if (path == NULL) {
path = xmlGetNodePath(
xmlTextReaderCurrentNode(reader));
}
fprintf(lint->errStream,
"xmlPatternMatch and xmlStreamPush disagree\n");
if (path != NULL)
fprintf(lint->errStream, " pattern %s node %s\n",
lint->pattern, path);
else
fprintf(lint->errStream, " pattern %s node %s\n",
lint->pattern, xmlTextReaderConstName(reader));
}
}
if ((type == XML_READER_TYPE_END_ELEMENT) ||
((type == XML_READER_TYPE_ELEMENT) && (empty))) {
ret = xmlStreamPop(lint->patstream);
if (ret < 0) {
fprintf(lint->errStream, "xmlStreamPop() failure\n");
xmlFreeStreamCtxt(lint->patstream);
lint->patstream = NULL;
}
}
}
if (path != NULL)
xmlFree(path);
}
#endif
}
static void streamFile(xmllintState *lint, const char *filename) {
xmlParserInputBufferPtr input = NULL;
FILE *errStream = lint->errStream;
xmlTextReaderPtr reader;
int ret;
#if HAVE_DECL_MMAP
if (lint->memory) {
reader = xmlReaderForMemory(lint->memoryData, lint->memorySize,
filename, NULL, lint->options);
} else
#endif
{
if (strcmp(filename, "-") == 0) {
reader = xmlReaderForFd(STDIN_FILENO, "-", NULL, lint->options);
}
else {
/*
* There's still no easy way to get a reader for a file with
* adequate error repoting.
*/
xmlResetLastError();
input = xmlParserInputBufferCreateFilename(filename,
XML_CHAR_ENCODING_NONE);
if (input == NULL) {
const xmlError *error = xmlGetLastError();
if ((error != NULL) && (error->code == XML_ERR_NO_MEMORY)) {
lint->progresult = XMLLINT_ERR_MEM;
} else {
fprintf(errStream, "Unable to open %s\n", filename);
lint->progresult = XMLLINT_ERR_RDFILE;
}
return;
}
reader = xmlNewTextReader(input, filename);
if (reader == NULL) {
lint->progresult = XMLLINT_ERR_MEM;
xmlFreeParserInputBuffer(input);
return;
}
if (xmlTextReaderSetup(reader, NULL, NULL, NULL,
lint->options) < 0) {
lint->progresult = XMLLINT_ERR_MEM;
xmlFreeParserInputBuffer(input);
return;
}
}
}
if (reader == NULL) {
lint->progresult = XMLLINT_ERR_MEM;
return;
}
#ifdef LIBXML_PATTERN_ENABLED
if (lint->patternc != NULL) {
lint->patstream = xmlPatternGetStreamCtxt(lint->patternc);
if (lint->patstream != NULL) {
ret = xmlStreamPush(lint->patstream, NULL, NULL);
if (ret < 0) {
fprintf(errStream, "xmlStreamPush() failure\n");
xmlFreeStreamCtxt(lint->patstream);
lint->patstream = NULL;
}
}
}
#endif
xmlTextReaderSetResourceLoader(reader, xmllintResourceLoader, lint);
if (lint->maxAmpl > 0)
xmlTextReaderSetMaxAmplification(reader, lint->maxAmpl);
2024-06-11 18:14:43 +02:00
#ifdef LIBXML_RELAXNG_ENABLED
if (lint->relaxng != NULL) {
if ((lint->timing) && (lint->repeat == 1)) {
startTimer(lint);
}
ret = xmlTextReaderRelaxNGValidate(reader, lint->relaxng);
if (ret < 0) {
fprintf(errStream, "Relax-NG schema %s failed to compile\n",
lint->relaxng);
lint->progresult = XMLLINT_ERR_SCHEMACOMP;
lint->relaxng = NULL;
}
if ((lint->timing) && (lint->repeat == 1)) {
endTimer(lint, "Compiling the schemas");
}
}
#endif
#ifdef LIBXML_SCHEMAS_ENABLED
if (lint->schema != NULL) {
if ((lint->timing) && (lint->repeat == 1)) {
startTimer(lint);
}
ret = xmlTextReaderSchemaValidate(reader, lint->schema);
if (ret < 0) {
fprintf(errStream, "XSD schema %s failed to compile\n",
lint->schema);
lint->progresult = XMLLINT_ERR_SCHEMACOMP;
lint->schema = NULL;
}
if ((lint->timing) && (lint->repeat == 1)) {
endTimer(lint, "Compiling the schemas");
}
}
#endif
/*
* Process all nodes in sequence
*/
if ((lint->timing) && (lint->repeat == 1)) {
startTimer(lint);
}
ret = xmlTextReaderRead(reader);
while (ret == 1) {
if ((lint->debug)
#ifdef LIBXML_PATTERN_ENABLED
|| (lint->patternc)
#endif
)
processNode(lint, reader);
ret = xmlTextReaderRead(reader);
}
if ((lint->timing) && (lint->repeat == 1)) {
#ifdef LIBXML_RELAXNG_ENABLED
if (lint->relaxng != NULL)
endTimer(lint, "Parsing and validating");
else
#endif
#ifdef LIBXML_VALID_ENABLED
if (lint->options & XML_PARSE_DTDVALID)
endTimer(lint, "Parsing and validating");
else
#endif
endTimer(lint, "Parsing");
}
#ifdef LIBXML_VALID_ENABLED
if (lint->options & XML_PARSE_DTDVALID) {
if (xmlTextReaderIsValid(reader) != 1) {
fprintf(errStream,
"Document %s does not validate\n", filename);
lint->progresult = XMLLINT_ERR_VALID;
}
}
#endif /* LIBXML_VALID_ENABLED */
#if defined(LIBXML_RELAXNG_ENABLED) || defined(LIBXML_SCHEMAS_ENABLED)
{
int hasSchema = 0;
#ifdef LIBXML_RELAXNG_ENABLED
if (lint->relaxng != NULL)
hasSchema = 1;
#endif
#ifdef LIBXML_SCHEMAS_ENABLED
if (lint->schema != NULL)
hasSchema = 1;
#endif
if (hasSchema) {
if (xmlTextReaderIsValid(reader) != 1) {
fprintf(errStream, "%s fails to validate\n", filename);
lint->progresult = XMLLINT_ERR_VALID;
} else {
if (!lint->quiet) {
fprintf(errStream, "%s validates\n", filename);
}
}
}
}
#endif
/*
* Done, cleanup and status
*/
xmlFreeTextReader(reader);
xmlFreeParserInputBuffer(input);
if (ret != 0) {
fprintf(errStream, "%s : failed to parse\n", filename);
lint->progresult = XMLLINT_ERR_UNCLASS;
}
#ifdef LIBXML_PATTERN_ENABLED
if (lint->patstream != NULL) {
xmlFreeStreamCtxt(lint->patstream);
lint->patstream = NULL;
}
#endif
}
static void walkDoc(xmllintState *lint, xmlDocPtr doc) {
FILE *errStream = lint->errStream;
xmlTextReaderPtr reader;
int ret;
#ifdef LIBXML_PATTERN_ENABLED
if (lint->pattern != NULL) {
2024-05-06 02:34:01 +02:00
xmlNodePtr root;
const xmlChar *namespaces[22];
int i;
xmlNsPtr ns;
root = xmlDocGetRootElement(doc);
if (root == NULL ) {
fprintf(errStream,
2024-05-06 02:34:01 +02:00
"Document does not have a root element");
lint->progresult = XMLLINT_ERR_UNCLASS;
2024-05-06 02:34:01 +02:00
return;
}
for (ns = root->nsDef, i = 0;ns != NULL && i < 20;ns=ns->next) {
namespaces[i++] = ns->href;
namespaces[i++] = ns->prefix;
}
namespaces[i++] = NULL;
namespaces[i] = NULL;
ret = xmlPatternCompileSafe((const xmlChar *) lint->pattern, doc->dict,
0, &namespaces[0], &lint->patternc);
if (lint->patternc == NULL) {
2024-05-06 02:34:01 +02:00
if (ret < 0) {
lint->progresult = XMLLINT_ERR_MEM;
2024-05-06 02:34:01 +02:00
} else {
fprintf(errStream, "Pattern %s failed to compile\n",
lint->pattern);
lint->progresult = XMLLINT_ERR_SCHEMAPAT;
}
2024-05-06 02:34:01 +02:00
goto error;
}
2024-05-06 02:34:01 +02:00
lint->patstream = xmlPatternGetStreamCtxt(lint->patternc);
if (lint->patstream == NULL) {
lint->progresult = XMLLINT_ERR_MEM;
2024-05-06 02:34:01 +02:00
goto error;
}
ret = xmlStreamPush(lint->patstream, NULL, NULL);
2024-05-06 02:34:01 +02:00
if (ret < 0) {
fprintf(errStream, "xmlStreamPush() failure\n");
lint->progresult = XMLLINT_ERR_MEM;
2024-05-06 02:34:01 +02:00
goto error;
}
}
#endif /* LIBXML_PATTERN_ENABLED */
reader = xmlReaderWalker(doc);
if (reader != NULL) {
if ((lint->timing) && (lint->repeat == 1)) {
startTimer(lint);
}
ret = xmlTextReaderRead(reader);
while (ret == 1) {
if ((lint->debug)
#ifdef LIBXML_PATTERN_ENABLED
|| (lint->patternc)
#endif
)
processNode(lint, reader);
ret = xmlTextReaderRead(reader);
}
if ((lint->timing) && (lint->repeat == 1)) {
endTimer(lint, "walking through the doc");
}
xmlFreeTextReader(reader);
if (ret != 0) {
fprintf(errStream, "failed to walk through the doc\n");
lint->progresult = XMLLINT_ERR_UNCLASS;
}
} else {
fprintf(errStream, "Failed to create a reader from the document\n");
lint->progresult = XMLLINT_ERR_UNCLASS;
}
2024-05-06 02:34:01 +02:00
#ifdef LIBXML_PATTERN_ENABLED
2024-05-06 02:34:01 +02:00
error:
if (lint->patternc != NULL) {
xmlFreePattern(lint->patternc);
lint->patternc = NULL;
2024-05-06 02:34:01 +02:00
}
if (lint->patstream != NULL) {
xmlFreeStreamCtxt(lint->patstream);
lint->patstream = NULL;
}
#endif
}
#endif /* LIBXML_READER_ENABLED */
#ifdef LIBXML_XPATH_ENABLED
/************************************************************************
* *
* XPath Query *
* *
************************************************************************/
static void
doXPathDump(xmllintState *lint, xmlXPathObjectPtr cur) {
switch(cur->type) {
case XPATH_NODESET: {
#ifdef LIBXML_OUTPUT_ENABLED
xmlOutputBufferPtr buf;
xmlNodePtr node;
int i;
if ((cur->nodesetval == NULL) || (cur->nodesetval->nodeNr <= 0)) {
lint->progresult = XMLLINT_ERR_XPATH_EMPTY;
if (!lint->quiet) {
fprintf(lint->errStream, "XPath set is empty\n");
}
break;
}
buf = xmlOutputBufferCreateFile(stdout, NULL);
if (buf == NULL) {
lint->progresult = XMLLINT_ERR_MEM;
return;
}
for (i = 0;i < cur->nodesetval->nodeNr;i++) {
node = cur->nodesetval->nodeTab[i];
xmlNodeDumpOutput(buf, NULL, node, 0, 0, NULL);
xmlOutputBufferWrite(buf, 1, "\n");
}
xmlOutputBufferClose(buf);
#else
printf("xpath returned %d nodes\n", cur->nodesetval->nodeNr);
#endif
break;
}
case XPATH_BOOLEAN:
if (cur->boolval) printf("true\n");
else printf("false\n");
break;
case XPATH_NUMBER:
switch (xmlXPathIsInf(cur->floatval)) {
case 1:
printf("Infinity\n");
break;
case -1:
printf("-Infinity\n");
break;
default:
if (xmlXPathIsNaN(cur->floatval)) {
printf("NaN\n");
} else {
printf("%0g\n", cur->floatval);
}
}
break;
case XPATH_STRING:
printf("%s\n", (const char *) cur->stringval);
break;
case XPATH_UNDEFINED:
fprintf(lint->errStream, "XPath Object is uninitialized\n");
lint->progresult = XMLLINT_ERR_XPATH;
break;
default:
fprintf(lint->errStream, "XPath object of unexpected type\n");
lint->progresult = XMLLINT_ERR_XPATH;
break;
}
}
static void
doXPathQuery(xmllintState *lint, xmlDocPtr doc, const char *query) {
xmlXPathContextPtr ctxt = NULL;
xmlXPathCompExprPtr comp = NULL;
xmlXPathObjectPtr res = NULL;
ctxt = xmlXPathNewContext(doc);
if (ctxt == NULL) {
lint->progresult = XMLLINT_ERR_MEM;
goto error;
}
comp = xmlXPathCtxtCompile(ctxt, BAD_CAST query);
if (comp == NULL) {
fprintf(lint->errStream, "XPath compilation failure\n");
lint->progresult = XMLLINT_ERR_XPATH;
goto error;
}
#ifdef LIBXML_DEBUG_ENABLED
if (lint->debug) {
xmlXPathDebugDumpCompExpr(stdout, comp, 0);
printf("\n");
}
#endif
ctxt->node = (xmlNodePtr) doc;
res = xmlXPathCompiledEval(comp, ctxt);
if (res == NULL) {
fprintf(lint->errStream, "XPath evaluation failure\n");
lint->progresult = XMLLINT_ERR_XPATH;
goto error;
}
doXPathDump(lint, res);
error:
xmlXPathFreeObject(res);
xmlXPathFreeCompExpr(comp);
xmlXPathFreeContext(ctxt);
}
#endif /* LIBXML_XPATH_ENABLED */
/************************************************************************
* *
* Tree Test processing *
* *
************************************************************************/
static xmlDocPtr
parseFile(xmllintState *lint, const char *filename) {
xmlDocPtr doc = NULL;
if ((lint->generate) && (filename == NULL)) {
xmlNodePtr n;
doc = xmlNewDoc(BAD_CAST "1.0");
if (doc == NULL) {
lint->progresult = XMLLINT_ERR_MEM;
return(NULL);
}
n = xmlNewDocNode(doc, NULL, BAD_CAST "info", NULL);
if (n == NULL) {
xmlFreeDoc(doc);
lint->progresult = XMLLINT_ERR_MEM;
return(NULL);
}
if (xmlNodeSetContent(n, BAD_CAST "abc") < 0) {
xmlFreeNode(n);
xmlFreeDoc(doc);
lint->progresult = XMLLINT_ERR_MEM;
return(NULL);
}
xmlDocSetRootElement(doc, n);
return(doc);
}
#ifdef LIBXML_HTML_ENABLED
if (lint->html) {
doc = parseHtml(lint, filename);
return(doc);
}
#endif /* LIBXML_HTML_ENABLED */
{
doc = parseXml(lint, filename);
}
if (doc == NULL) {
if (lint->ctxt->errNo == XML_ERR_NO_MEMORY)
lint->progresult = XMLLINT_ERR_MEM;
else
lint->progresult = XMLLINT_ERR_RDFILE;
} else {
#ifdef LIBXML_VALID_ENABLED
if ((lint->options & XML_PARSE_DTDVALID) && (lint->ctxt->valid == 0))
lint->progresult = XMLLINT_ERR_VALID;
#endif /* LIBXML_VALID_ENABLED */
}
return(doc);
}
static void
parseAndPrintFile(xmllintState *lint, const char *filename) {
FILE *errStream = lint->errStream;
xmlDocPtr doc;
/* Avoid unused variable warning */
(void) errStream;
if ((lint->timing) && (lint->repeat == 1))
startTimer(lint);
doc = parseFile(lint, filename);
if (doc == NULL) {
if (lint->progresult == XMLLINT_RETURN_OK)
lint->progresult = XMLLINT_ERR_UNCLASS;
return;
}
if ((lint->timing) && (lint->repeat == 1)) {
endTimer(lint, "Parsing");
}
if (lint->dropdtd) {
xmlDtdPtr dtd;
dtd = xmlGetIntSubset(doc);
if (dtd != NULL) {
xmlUnlinkNode((xmlNodePtr)dtd);
doc->intSubset = dtd;
}
}
#ifdef LIBXML_XINCLUDE_ENABLED
if (lint->xinclude) {
if ((lint->timing) && (lint->repeat == 1)) {
startTimer(lint);
}
if (xmlXIncludeProcessFlags(doc, lint->options) < 0) {
lint->progresult = XMLLINT_ERR_UNCLASS;
goto done;
}
if ((lint->timing) && (lint->repeat == 1)) {
endTimer(lint, "Xinclude processing");
}
}
#endif
/*
* shell interaction
*/
if (lint->shell) {
#ifdef LIBXML_XPATH_ENABLED
xmlXPathOrderDocElems(doc);
#endif
xmllintShell(doc, filename, stdout);
goto done;
}
#ifdef LIBXML_XPATH_ENABLED
if (lint->xpathquery != NULL) {
xmlXPathOrderDocElems(doc);
doXPathQuery(lint, doc, lint->xpathquery);
}
#endif
/*
* test intermediate copy if needed.
*/
if (lint->copy) {
xmlDocPtr tmp;
tmp = doc;
if (lint->timing) {
startTimer(lint);
}
doc = xmlCopyDoc(doc, 1);
if (doc == NULL) {
lint->progresult = XMLLINT_ERR_MEM;
xmlFreeDoc(tmp);
return;
}
if (lint->timing) {
endTimer(lint, "Copying");
}
if (lint->timing) {
startTimer(lint);
}
xmlFreeDoc(tmp);
if (lint->timing) {
endTimer(lint, "Freeing original");
}
}
#ifdef LIBXML_VALID_ENABLED
if ((lint->insert)
#ifdef LIBXML_HTML_ENABLED
&& (!lint->html)
#endif
) {
const xmlChar* list[256];
int nb, i;
xmlNodePtr node;
if (doc->children != NULL) {
node = doc->children;
while ((node != NULL) &&
((node->type != XML_ELEMENT_NODE) ||
(node->last == NULL)))
node = node->next;
if (node != NULL) {
nb = xmlValidGetValidElements(node->last, NULL, list, 256);
if (nb < 0) {
fprintf(errStream, "could not get valid list of elements\n");
} else if (nb == 0) {
fprintf(errStream, "No element can be inserted under root\n");
} else {
fprintf(errStream, "%d element types can be inserted under root:\n",
nb);
for (i = 0;i < nb;i++) {
fprintf(errStream, "%s\n", (char *) list[i]);
}
}
}
}
} else
#endif /* LIBXML_VALID_ENABLED */
#ifdef LIBXML_READER_ENABLED
if (lint->walker) {
walkDoc(lint, doc);
}
#endif /* LIBXML_READER_ENABLED */
#ifdef LIBXML_OUTPUT_ENABLED
if (lint->noout == 0) {
if (lint->compress)
2024-04-28 17:54:36 +02:00
xmlSetDocCompressMode(doc, 9);
/*
* print it.
*/
#ifdef LIBXML_DEBUG_ENABLED
if (!lint->debug) {
#endif
if ((lint->timing) && (lint->repeat == 1)) {
startTimer(lint);
}
#ifdef LIBXML_HTML_ENABLED
if ((lint->html) && (!lint->xmlout)) {
if (lint->compress) {
htmlSaveFile(lint->output ? lint->output : "-", doc);
}
else if (lint->encoding != NULL) {
if (lint->format == 1) {
htmlSaveFileFormat(lint->output ? lint->output : "-",
doc, lint->encoding, 1);
}
else {
htmlSaveFileFormat(lint->output ? lint->output : "-",
doc, lint->encoding, 0);
}
}
else if (lint->format == 1) {
htmlSaveFileFormat(lint->output ? lint->output : "-",
doc, NULL, 1);
}
else {
FILE *out;
if (lint->output == NULL)
out = stdout;
else {
out = fopen(lint->output,"wb");
}
if (out != NULL) {
if (htmlDocDump(out, doc) < 0)
lint->progresult = XMLLINT_ERR_OUT;
if (lint->output != NULL)
fclose(out);
} else {
fprintf(errStream, "failed to open %s\n",
lint->output);
lint->progresult = XMLLINT_ERR_OUT;
}
}
if ((lint->timing) && (lint->repeat == 1)) {
endTimer(lint, "Saving");
}
} else
#endif
#ifdef LIBXML_C14N_ENABLED
if (lint->canonical) {
xmlChar *result = NULL;
int size;
size = xmlC14NDocDumpMemory(doc, NULL, XML_C14N_1_0, NULL, 1, &result);
if (size >= 0) {
if (write(1, result, size) == -1) {
fprintf(errStream, "Can't write data\n");
}
xmlFree(result);
} else {
fprintf(errStream, "Failed to canonicalize\n");
lint->progresult = XMLLINT_ERR_OUT;
}
} else if (lint->canonical_11) {
xmlChar *result = NULL;
int size;
size = xmlC14NDocDumpMemory(doc, NULL, XML_C14N_1_1, NULL, 1, &result);
if (size >= 0) {
if (write(1, result, size) == -1) {
fprintf(errStream, "Can't write data\n");
}
xmlFree(result);
} else {
fprintf(errStream, "Failed to canonicalize\n");
lint->progresult = XMLLINT_ERR_OUT;
}
} else if (lint->exc_canonical) {
xmlChar *result = NULL;
int size;
size = xmlC14NDocDumpMemory(doc, NULL, XML_C14N_EXCLUSIVE_1_0, NULL, 1, &result);
if (size >= 0) {
if (write(1, result, size) == -1) {
fprintf(errStream, "Can't write data\n");
}
xmlFree(result);
} else {
fprintf(errStream, "Failed to canonicalize\n");
lint->progresult = XMLLINT_ERR_OUT;
}
} else
#endif
#if HAVE_DECL_MMAP
if (lint->memory) {
xmlChar *result;
int len;
if (lint->encoding != NULL) {
if (lint->format == 1) {
xmlDocDumpFormatMemoryEnc(doc, &result, &len,
lint->encoding, 1);
} else {
xmlDocDumpMemoryEnc(doc, &result, &len,
lint->encoding);
}
} else {
if (lint->format == 1)
xmlDocDumpFormatMemory(doc, &result, &len, 1);
else
xmlDocDumpMemory(doc, &result, &len);
}
if (result == NULL) {
fprintf(errStream, "Failed to save\n");
lint->progresult = XMLLINT_ERR_OUT;
} else {
if (write(1, result, len) == -1) {
fprintf(errStream, "Can't write data\n");
}
xmlFree(result);
}
} else
#endif /* HAVE_DECL_MMAP */
if (lint->compress) {
xmlSaveFile(lint->output ? lint->output : "-", doc);
} else {
xmlSaveCtxtPtr ctxt;
int saveOpts = 0;
if (lint->format == 1)
saveOpts |= XML_SAVE_FORMAT;
else if (lint->format == 2)
saveOpts |= XML_SAVE_WSNONSIG;
#if defined(LIBXML_HTML_ENABLED)
if (lint->xmlout)
saveOpts |= XML_SAVE_AS_XML;
#endif
if (lint->output == NULL)
ctxt = xmlSaveToFd(STDOUT_FILENO, lint->encoding,
saveOpts);
else
ctxt = xmlSaveToFilename(lint->output, lint->encoding,
saveOpts);
if (ctxt != NULL) {
if (xmlSaveDoc(ctxt, doc) < 0) {
fprintf(errStream, "failed save to %s\n",
lint->output ? lint->output : "-");
lint->progresult = XMLLINT_ERR_OUT;
}
xmlSaveClose(ctxt);
} else {
lint->progresult = XMLLINT_ERR_OUT;
}
}
if ((lint->timing) && (lint->repeat == 1)) {
endTimer(lint, "Saving");
}
#ifdef LIBXML_DEBUG_ENABLED
} else {
FILE *out;
if (lint->output == NULL)
out = stdout;
else {
out = fopen(lint->output, "wb");
}
if (out != NULL) {
xmlDebugDumpDocument(out, doc);
if (lint->output != NULL)
fclose(out);
} else {
fprintf(errStream, "failed to open %s\n", lint->output);
lint->progresult = XMLLINT_ERR_OUT;
}
}
#endif
}
#endif /* LIBXML_OUTPUT_ENABLED */
#ifdef LIBXML_VALID_ENABLED
/*
* A posteriori validation test
*/
if ((lint->dtdvalid != NULL) || (lint->dtdvalidfpi != NULL)) {
xmlDtdPtr dtd;
if ((lint->timing) && (lint->repeat == 1)) {
startTimer(lint);
}
if (lint->dtdvalid != NULL)
dtd = xmlParseDTD(NULL, BAD_CAST lint->dtdvalid);
else
dtd = xmlParseDTD(BAD_CAST lint->dtdvalidfpi, NULL);
if ((lint->timing) && (lint->repeat == 1)) {
endTimer(lint, "Parsing DTD");
}
if (dtd == NULL) {
if (lint->dtdvalid != NULL)
fprintf(errStream, "Could not parse DTD %s\n",
lint->dtdvalid);
else
fprintf(errStream, "Could not parse DTD %s\n",
lint->dtdvalidfpi);
lint->progresult = XMLLINT_ERR_DTD;
} else {
xmlValidCtxtPtr cvp;
cvp = xmlNewValidCtxt();
if (cvp == NULL) {
lint->progresult = XMLLINT_ERR_MEM;
xmlFreeDtd(dtd);
return;
}
if ((lint->timing) && (lint->repeat == 1)) {
startTimer(lint);
}
if (!xmlValidateDtd(cvp, doc, dtd)) {
if (lint->dtdvalid != NULL)
fprintf(errStream,
"Document %s does not validate against %s\n",
filename, lint->dtdvalid);
else
fprintf(errStream,
"Document %s does not validate against %s\n",
filename, lint->dtdvalidfpi);
lint->progresult = XMLLINT_ERR_VALID;
}
if ((lint->timing) && (lint->repeat == 1)) {
endTimer(lint, "Validating against DTD");
}
xmlFreeValidCtxt(cvp);
xmlFreeDtd(dtd);
}
} else if (lint->postvalid) {
xmlValidCtxtPtr cvp;
cvp = xmlNewValidCtxt();
if (cvp == NULL) {
lint->progresult = XMLLINT_ERR_MEM;
xmlFreeDoc(doc);
return;
}
if ((lint->timing) && (lint->repeat == 1)) {
startTimer(lint);
}
if (!xmlValidateDocument(cvp, doc)) {
fprintf(errStream,
"Document %s does not validate\n", filename);
lint->progresult = XMLLINT_ERR_VALID;
}
if ((lint->timing) && (lint->repeat == 1)) {
endTimer(lint, "Validating");
}
xmlFreeValidCtxt(cvp);
}
#endif /* LIBXML_VALID_ENABLED */
#ifdef LIBXML_SCHEMATRON_ENABLED
if (lint->wxschematron != NULL) {
xmlSchematronValidCtxtPtr ctxt;
int ret;
int flag;
if ((lint->timing) && (lint->repeat == 1)) {
startTimer(lint);
}
if (lint->debug)
flag = XML_SCHEMATRON_OUT_XML;
else
flag = XML_SCHEMATRON_OUT_TEXT;
if (lint->noout)
flag |= XML_SCHEMATRON_OUT_QUIET;
ctxt = xmlSchematronNewValidCtxt(lint->wxschematron, flag);
if (ctxt == NULL) {
lint->progresult = XMLLINT_ERR_MEM;
xmlFreeDoc(doc);
return;
}
ret = xmlSchematronValidateDoc(ctxt, doc);
if (ret == 0) {
if (!lint->quiet) {
fprintf(errStream, "%s validates\n", filename);
}
} else if (ret > 0) {
fprintf(errStream, "%s fails to validate\n", filename);
lint->progresult = XMLLINT_ERR_VALID;
} else {
fprintf(errStream, "%s validation generated an internal error\n",
filename);
lint->progresult = XMLLINT_ERR_VALID;
}
xmlSchematronFreeValidCtxt(ctxt);
if ((lint->timing) && (lint->repeat == 1)) {
endTimer(lint, "Validating");
}
}
#endif
#ifdef LIBXML_RELAXNG_ENABLED
if (lint->relaxngschemas != NULL) {
xmlRelaxNGValidCtxtPtr ctxt;
int ret;
if ((lint->timing) && (lint->repeat == 1)) {
startTimer(lint);
}
ctxt = xmlRelaxNGNewValidCtxt(lint->relaxngschemas);
if (ctxt == NULL) {
lint->progresult = XMLLINT_ERR_MEM;
xmlFreeDoc(doc);
return;
}
ret = xmlRelaxNGValidateDoc(ctxt, doc);
if (ret == 0) {
if (!lint->quiet) {
fprintf(errStream, "%s validates\n", filename);
}
} else if (ret > 0) {
fprintf(errStream, "%s fails to validate\n", filename);
lint->progresult = XMLLINT_ERR_VALID;
} else {
fprintf(errStream, "%s validation generated an internal error\n",
filename);
lint->progresult = XMLLINT_ERR_VALID;
}
xmlRelaxNGFreeValidCtxt(ctxt);
if ((lint->timing) && (lint->repeat == 1)) {
endTimer(lint, "Validating");
}
}
#endif /* LIBXML_RELAXNG_ENABLED */
#ifdef LIBXML_SCHEMAS_ENABLED
if (lint->wxschemas != NULL) {
xmlSchemaValidCtxtPtr ctxt;
int ret;
if ((lint->timing) && (lint->repeat == 1)) {
startTimer(lint);
}
ctxt = xmlSchemaNewValidCtxt(lint->wxschemas);
if (ctxt == NULL) {
lint->progresult = XMLLINT_ERR_MEM;
xmlFreeDoc(doc);
return;
}
ret = xmlSchemaValidateDoc(ctxt, doc);
if (ret == 0) {
if (!lint->quiet) {
fprintf(errStream, "%s validates\n", filename);
}
} else if (ret > 0) {
fprintf(errStream, "%s fails to validate\n", filename);
lint->progresult = XMLLINT_ERR_VALID;
} else {
fprintf(errStream, "%s validation generated an internal error\n",
filename);
lint->progresult = XMLLINT_ERR_VALID;
}
xmlSchemaFreeValidCtxt(ctxt);
if ((lint->timing) && (lint->repeat == 1)) {
endTimer(lint, "Validating");
}
}
#endif /* LIBXML_SCHEMAS_ENABLED */
#ifdef LIBXML_DEBUG_ENABLED
if ((lint->debugent)
#if defined(LIBXML_HTML_ENABLED)
&& (!lint->html)
#endif
)
xmlDebugDumpEntities(errStream, doc);
#endif
2025-01-17 13:04:35 +01:00
/* Avoid unused label warning */
goto done;
done:
/*
* free it.
*/
if ((lint->timing) && (lint->repeat == 1)) {
startTimer(lint);
}
xmlFreeDoc(doc);
if ((lint->timing) && (lint->repeat == 1)) {
endTimer(lint, "Freeing");
}
}
/************************************************************************
* *
* Usage and Main *
* *
************************************************************************/
static void showVersion(FILE *errStream, const char *name) {
fprintf(errStream, "%s: using libxml version %s\n", name, xmlParserVersion);
fprintf(errStream, " compiled with: ");
if (xmlHasFeature(XML_WITH_THREAD)) fprintf(errStream, "Threads ");
if (xmlHasFeature(XML_WITH_TREE)) fprintf(errStream, "Tree ");
if (xmlHasFeature(XML_WITH_OUTPUT)) fprintf(errStream, "Output ");
if (xmlHasFeature(XML_WITH_PUSH)) fprintf(errStream, "Push ");
if (xmlHasFeature(XML_WITH_READER)) fprintf(errStream, "Reader ");
if (xmlHasFeature(XML_WITH_PATTERN)) fprintf(errStream, "Patterns ");
if (xmlHasFeature(XML_WITH_WRITER)) fprintf(errStream, "Writer ");
if (xmlHasFeature(XML_WITH_SAX1)) fprintf(errStream, "SAXv1 ");
if (xmlHasFeature(XML_WITH_HTTP)) fprintf(errStream, "HTTP ");
if (xmlHasFeature(XML_WITH_VALID)) fprintf(errStream, "DTDValid ");
if (xmlHasFeature(XML_WITH_HTML)) fprintf(errStream, "HTML ");
if (xmlHasFeature(XML_WITH_LEGACY)) fprintf(errStream, "Legacy ");
if (xmlHasFeature(XML_WITH_C14N)) fprintf(errStream, "C14N ");
if (xmlHasFeature(XML_WITH_CATALOG)) fprintf(errStream, "Catalog ");
if (xmlHasFeature(XML_WITH_XPATH)) fprintf(errStream, "XPath ");
if (xmlHasFeature(XML_WITH_XPTR)) fprintf(errStream, "XPointer ");
if (xmlHasFeature(XML_WITH_XINCLUDE)) fprintf(errStream, "XInclude ");
if (xmlHasFeature(XML_WITH_ICONV)) fprintf(errStream, "Iconv ");
if (xmlHasFeature(XML_WITH_ICU)) fprintf(errStream, "ICU ");
if (xmlHasFeature(XML_WITH_ISO8859X)) fprintf(errStream, "ISO8859X ");
if (xmlHasFeature(XML_WITH_UNICODE)) fprintf(errStream, "Unicode ");
if (xmlHasFeature(XML_WITH_REGEXP)) fprintf(errStream, "Regexps ");
if (xmlHasFeature(XML_WITH_AUTOMATA)) fprintf(errStream, "Automata ");
if (xmlHasFeature(XML_WITH_EXPR)) fprintf(errStream, "Expr ");
if (xmlHasFeature(XML_WITH_RELAXNG)) fprintf(errStream, "RelaxNG ");
if (xmlHasFeature(XML_WITH_SCHEMAS)) fprintf(errStream, "Schemas ");
if (xmlHasFeature(XML_WITH_SCHEMATRON)) fprintf(errStream, "Schematron ");
if (xmlHasFeature(XML_WITH_MODULES)) fprintf(errStream, "Modules ");
if (xmlHasFeature(XML_WITH_DEBUG)) fprintf(errStream, "Debug ");
if (xmlHasFeature(XML_WITH_ZLIB)) fprintf(errStream, "Zlib ");
if (xmlHasFeature(XML_WITH_LZMA)) fprintf(errStream, "Lzma ");
fprintf(errStream, "\n");
}
static void usage(FILE *f, const char *name) {
fprintf(f, "Usage : %s [options] XMLfiles ...\n", name);
#ifdef LIBXML_OUTPUT_ENABLED
fprintf(f, "\tParse the XML files and output the result of the parsing\n");
#else
fprintf(f, "\tParse the XML files\n");
#endif /* LIBXML_OUTPUT_ENABLED */
fprintf(f, "\t--version : display the version of the XML library used\n");
fprintf(f, "\t--shell : run a navigating shell\n");
#ifdef LIBXML_DEBUG_ENABLED
fprintf(f, "\t--debug : dump a debug tree of the in-memory document\n");
fprintf(f, "\t--debugent : debug the entities defined in the document\n");
#else
#ifdef LIBXML_READER_ENABLED
fprintf(f, "\t--debug : dump the nodes content when using --stream\n");
#endif /* LIBXML_READER_ENABLED */
#endif
fprintf(f, "\t--copy : used to test the internal copy implementation\n");
fprintf(f, "\t--recover : output what was parsable on broken XML documents\n");
fprintf(f, "\t--huge : remove any internal arbitrary parser limits\n");
fprintf(f, "\t--noent : substitute entity references by their value\n");
fprintf(f, "\t--noenc : ignore any encoding specified inside the document\n");
fprintf(f, "\t--noout : don't output the result tree\n");
fprintf(f, "\t--path 'paths': provide a set of paths for resources\n");
fprintf(f, "\t--load-trace : print trace of all external entities loaded\n");
fprintf(f, "\t--nonet : refuse to fetch DTDs or entities over network\n");
fprintf(f, "\t--nocompact : do not generate compact text nodes\n");
fprintf(f, "\t--htmlout : output results as HTML\n");
fprintf(f, "\t--nowrap : do not put HTML doc wrapper\n");
#ifdef LIBXML_VALID_ENABLED
fprintf(f, "\t--valid : validate the document in addition to std well-formed check\n");
fprintf(f, "\t--postvalid : do a posteriori validation, i.e after parsing\n");
fprintf(f, "\t--dtdvalid URL : do a posteriori validation against a given DTD\n");
fprintf(f, "\t--dtdvalidfpi FPI : same but name the DTD with a Public Identifier\n");
fprintf(f, "\t--insert : ad-hoc test for valid insertions\n");
#endif /* LIBXML_VALID_ENABLED */
fprintf(f, "\t--quiet : be quiet when succeeded\n");
fprintf(f, "\t--timing : print some timings\n");
fprintf(f, "\t--repeat : repeat 100 times, for timing or profiling\n");
fprintf(f, "\t--dropdtd : remove the DOCTYPE of the input docs\n");
#ifdef LIBXML_HTML_ENABLED
fprintf(f, "\t--html : use the HTML parser\n");
fprintf(f, "\t--xmlout : force to use the XML serializer when using --html\n");
fprintf(f, "\t--nodefdtd : do not default HTML doctype\n");
#endif
#ifdef LIBXML_PUSH_ENABLED
fprintf(f, "\t--push : use the push mode of the parser\n");
#endif /* LIBXML_PUSH_ENABLED */
#if HAVE_DECL_MMAP
fprintf(f, "\t--memory : parse from memory\n");
#endif
fprintf(f, "\t--maxmem nbbytes : limits memory allocation to nbbytes bytes\n");
fprintf(f, "\t--nowarning : do not emit warnings from parser/validator\n");
fprintf(f, "\t--noblanks : drop (ignorable?) blanks spaces\n");
fprintf(f, "\t--nocdata : replace cdata section with text nodes\n");
fprintf(f, "\t--nodict : create document without dictionary\n");
fprintf(f, "\t--pedantic : enable additional warnings\n");
#ifdef LIBXML_OUTPUT_ENABLED
fprintf(f, "\t--output file or -o file: save to a given file\n");
fprintf(f, "\t--format : reformat/reindent the output\n");
fprintf(f, "\t--encode encoding : output in the given encoding\n");
fprintf(f, "\t--pretty STYLE : pretty-print in a particular style\n");
fprintf(f, "\t 0 Do not pretty print\n");
fprintf(f, "\t 1 Format the XML content, as --format\n");
fprintf(f, "\t 2 Add whitespace inside tags, preserving content\n");
#ifdef LIBXML_ZLIB_ENABLED
fprintf(f, "\t--compress : turn on gzip compression of output\n");
#endif
#endif /* LIBXML_OUTPUT_ENABLED */
fprintf(f, "\t--c14n : save in W3C canonical format v1.0 (with comments)\n");
fprintf(f, "\t--c14n11 : save in W3C canonical format v1.1 (with comments)\n");
fprintf(f, "\t--exc-c14n : save in W3C exclusive canonical format (with comments)\n");
#ifdef LIBXML_C14N_ENABLED
#endif /* LIBXML_C14N_ENABLED */
fprintf(f, "\t--nsclean : remove redundant namespace declarations\n");
fprintf(f, "\t--testIO : test user I/O support\n");
#ifdef LIBXML_CATALOG_ENABLED
fprintf(f, "\t--catalogs : use SGML catalogs from $SGML_CATALOG_FILES\n");
fprintf(f, "\t otherwise XML Catalogs starting from \n");
fprintf(f, "\t file://" XML_SYSCONFDIR "/xml/catalog "
"are activated by default\n");
fprintf(f, "\t--nocatalogs: deactivate all catalogs\n");
#endif
fprintf(f, "\t--auto : generate a small doc on the fly\n");
#ifdef LIBXML_XINCLUDE_ENABLED
fprintf(f, "\t--xinclude : do XInclude processing\n");
fprintf(f, "\t--noxincludenode : same but do not generate XInclude nodes\n");
fprintf(f, "\t--nofixup-base-uris : do not fixup xml:base uris\n");
#endif
fprintf(f, "\t--loaddtd : fetch external DTD\n");
fprintf(f, "\t--dtdattr : loaddtd + populate the tree with inherited attributes \n");
#ifdef LIBXML_READER_ENABLED
fprintf(f, "\t--stream : use the streaming interface to process very large files\n");
fprintf(f, "\t--walker : create a reader and walk though the resulting doc\n");
#ifdef LIBXML_PATTERN_ENABLED
fprintf(f, "\t--pattern pattern_value : test the pattern support\n");
#endif
#endif /* LIBXML_READER_ENABLED */
#ifdef LIBXML_RELAXNG_ENABLED
fprintf(f, "\t--relaxng schema : do RelaxNG validation against the schema\n");
#endif
#ifdef LIBXML_SCHEMAS_ENABLED
fprintf(f, "\t--schema schema : do validation against the WXS schema\n");
#endif
#ifdef LIBXML_SCHEMATRON_ENABLED
fprintf(f, "\t--schematron schema : do validation against a schematron\n");
#endif
#ifdef LIBXML_SAX1_ENABLED
fprintf(f, "\t--sax1: use the old SAX1 interfaces for processing\n");
#endif
fprintf(f, "\t--sax: do not build a tree but work just at the SAX level\n");
fprintf(f, "\t--oldxml10: use XML-1.0 parsing rules before the 5th edition\n");
#ifdef LIBXML_XPATH_ENABLED
fprintf(f, "\t--xpath expr: evaluate the XPath expression, imply --noout\n");
#endif
fprintf(f, "\t--max-ampl value: set maximum amplification factor\n");
fprintf(f, "\nLibxml project home page: https://gitlab.gnome.org/GNOME/libxml2\n");
}
static unsigned long
parseInteger(FILE *errStream, const char *ctxt, const char *str,
unsigned long min, unsigned long max) {
char *strEnd;
unsigned long val;
errno = 0;
val = strtoul(str, &strEnd, 10);
if (errno == EINVAL || *strEnd != 0) {
fprintf(errStream, "%s: invalid integer: %s\n", ctxt, str);
exit(XMLLINT_ERR_UNCLASS);
}
if (errno != 0 || val < min || val > max) {
fprintf(errStream, "%s: integer out of range: %s\n", ctxt, str);
exit(XMLLINT_ERR_UNCLASS);
}
return(val);
}
static int
skipArgs(const char *arg) {
if ((!strcmp(arg, "-path")) ||
(!strcmp(arg, "--path")) ||
(!strcmp(arg, "-maxmem")) ||
(!strcmp(arg, "--maxmem")) ||
#ifdef LIBXML_OUTPUT_ENABLED
(!strcmp(arg, "-o")) ||
(!strcmp(arg, "-output")) ||
(!strcmp(arg, "--output")) ||
(!strcmp(arg, "-encode")) ||
(!strcmp(arg, "--encode")) ||
(!strcmp(arg, "-pretty")) ||
(!strcmp(arg, "--pretty")) ||
#endif
#ifdef LIBXML_VALID_ENABLED
(!strcmp(arg, "-dtdvalid")) ||
(!strcmp(arg, "--dtdvalid")) ||
(!strcmp(arg, "-dtdvalidfpi")) ||
(!strcmp(arg, "--dtdvalidfpi")) ||
#endif
#ifdef LIBXML_RELAXNG_ENABLED
(!strcmp(arg, "-relaxng")) ||
(!strcmp(arg, "--relaxng")) ||
#endif
#ifdef LIBXML_SCHEMAS_ENABLED
(!strcmp(arg, "-schema")) ||
(!strcmp(arg, "--schema")) ||
#endif
#ifdef LIBXML_SCHEMATRON_ENABLED
(!strcmp(arg, "-schematron")) ||
(!strcmp(arg, "--schematron")) ||
#endif
#if defined(LIBXML_READER_ENABLED) && defined(LIBXML_PATTERN_ENABLED)
(!strcmp(arg, "-pattern")) ||
(!strcmp(arg, "--pattern")) ||
#endif
#ifdef LIBXML_XPATH_ENABLED
(!strcmp(arg, "-xpath")) ||
(!strcmp(arg, "--xpath")) ||
#endif
(!strcmp(arg, "-max-ampl")) ||
(!strcmp(arg, "--max-ampl"))
) {
return(1);
}
return(0);
}
static void
xmllintInit(xmllintState *lint) {
memset(lint, 0, sizeof(*lint));
2024-06-11 18:14:43 +02:00
lint->repeat = 1;
lint->progresult = XMLLINT_RETURN_OK;
lint->options = XML_PARSE_COMPACT | XML_PARSE_BIG_LINES;
}
2024-05-13 12:18:08 +02:00
static int
xmllintParseOptions(xmllintState *lint, int argc, const char **argv) {
FILE *errStream = lint->errStream;
int i;
if (argc <= 1) {
usage(errStream, argv[0]);
return(XMLLINT_ERR_UNCLASS);
}
for (i = 1; i < argc ; i++) {
if (argv[i][0] != '-' || argv[i][1] == 0)
continue;
if ((!strcmp(argv[i], "-maxmem")) ||
(!strcmp(argv[i], "--maxmem"))) {
i++;
if (i >= argc) {
fprintf(errStream, "maxmem: missing integer value\n");
return(XMLLINT_ERR_UNCLASS);
}
errno = 0;
lint->maxmem = parseInteger(errStream, "maxmem", argv[i],
0, INT_MAX);
} else if ((!strcmp(argv[i], "-debug")) ||
(!strcmp(argv[i], "--debug"))) {
lint->debug = 1;
} else if ((!strcmp(argv[i], "-shell")) ||
(!strcmp(argv[i], "--shell"))) {
lint->shell = 1;
} else if ((!strcmp(argv[i], "-copy")) ||
(!strcmp(argv[i], "--copy"))) {
lint->copy = 1;
} else if ((!strcmp(argv[i], "-recover")) ||
(!strcmp(argv[i], "--recover"))) {
lint->options |= XML_PARSE_RECOVER;
} else if ((!strcmp(argv[i], "-huge")) ||
(!strcmp(argv[i], "--huge"))) {
lint->options |= XML_PARSE_HUGE;
} else if ((!strcmp(argv[i], "-noent")) ||
(!strcmp(argv[i], "--noent"))) {
lint->options |= XML_PARSE_NOENT;
} else if ((!strcmp(argv[i], "-noenc")) ||
(!strcmp(argv[i], "--noenc"))) {
lint->options |= XML_PARSE_IGNORE_ENC;
} else if ((!strcmp(argv[i], "-nsclean")) ||
(!strcmp(argv[i], "--nsclean"))) {
lint->options |= XML_PARSE_NSCLEAN;
} else if ((!strcmp(argv[i], "-nocdata")) ||
(!strcmp(argv[i], "--nocdata"))) {
lint->options |= XML_PARSE_NOCDATA;
} else if ((!strcmp(argv[i], "-nodict")) ||
(!strcmp(argv[i], "--nodict"))) {
lint->options |= XML_PARSE_NODICT;
} else if ((!strcmp(argv[i], "-version")) ||
(!strcmp(argv[i], "--version"))) {
showVersion(errStream, argv[0]);
lint->version = 1;
} else if ((!strcmp(argv[i], "-noout")) ||
(!strcmp(argv[i], "--noout"))) {
lint->noout = 1;
} else if ((!strcmp(argv[i], "-htmlout")) ||
(!strcmp(argv[i], "--htmlout"))) {
lint->htmlout = 1;
} else if ((!strcmp(argv[i], "-nowrap")) ||
(!strcmp(argv[i], "--nowrap"))) {
lint->nowrap = 1;
#ifdef LIBXML_HTML_ENABLED
} else if ((!strcmp(argv[i], "-html")) ||
(!strcmp(argv[i], "--html"))) {
lint->html = 1;
} else if ((!strcmp(argv[i], "-xmlout")) ||
(!strcmp(argv[i], "--xmlout"))) {
lint->xmlout = 1;
} else if ((!strcmp(argv[i], "-nodefdtd")) ||
(!strcmp(argv[i], "--nodefdtd"))) {
lint->options |= HTML_PARSE_NODEFDTD;
#endif /* LIBXML_HTML_ENABLED */
} else if ((!strcmp(argv[i], "-loaddtd")) ||
(!strcmp(argv[i], "--loaddtd"))) {
lint->options |= XML_PARSE_DTDLOAD;
} else if ((!strcmp(argv[i], "-dtdattr")) ||
(!strcmp(argv[i], "--dtdattr"))) {
lint->options |= XML_PARSE_DTDATTR;
#ifdef LIBXML_VALID_ENABLED
} else if ((!strcmp(argv[i], "-valid")) ||
(!strcmp(argv[i], "--valid"))) {
lint->options |= XML_PARSE_DTDVALID;
} else if ((!strcmp(argv[i], "-postvalid")) ||
(!strcmp(argv[i], "--postvalid"))) {
lint->postvalid = 1;
lint->options |= XML_PARSE_DTDLOAD;
} else if ((!strcmp(argv[i], "-dtdvalid")) ||
(!strcmp(argv[i], "--dtdvalid"))) {
i++;
lint->dtdvalid = argv[i];
lint->options |= XML_PARSE_DTDLOAD;
} else if ((!strcmp(argv[i], "-dtdvalidfpi")) ||
(!strcmp(argv[i], "--dtdvalidfpi"))) {
i++;
lint->dtdvalidfpi = argv[i];
lint->options |= XML_PARSE_DTDLOAD;
} else if ((!strcmp(argv[i], "-insert")) ||
(!strcmp(argv[i], "--insert"))) {
lint->insert = 1;
#endif /* LIBXML_VALID_ENABLED */
} else if ((!strcmp(argv[i], "-dropdtd")) ||
(!strcmp(argv[i], "--dropdtd"))) {
lint->dropdtd = 1;
} else if ((!strcmp(argv[i], "-quiet")) ||
(!strcmp(argv[i], "--quiet"))) {
lint->quiet = 1;
} else if ((!strcmp(argv[i], "-timing")) ||
(!strcmp(argv[i], "--timing"))) {
lint->timing = 1;
} else if ((!strcmp(argv[i], "-auto")) ||
(!strcmp(argv[i], "--auto"))) {
lint->generate = 1;
} else if ((!strcmp(argv[i], "-repeat")) ||
(!strcmp(argv[i], "--repeat"))) {
#ifdef FUZZING_BUILD_MODE_UNSAFE_FOR_PRODUCTION
lint->repeat = 2;
#else
if (lint->repeat > 1)
lint->repeat *= 10;
else
lint->repeat = 100;
#endif
#ifdef LIBXML_PUSH_ENABLED
} else if ((!strcmp(argv[i], "-push")) ||
(!strcmp(argv[i], "--push"))) {
lint->push = 1;
#endif /* LIBXML_PUSH_ENABLED */
#if HAVE_DECL_MMAP
} else if ((!strcmp(argv[i], "-memory")) ||
(!strcmp(argv[i], "--memory"))) {
lint->memory = 1;
#endif
} else if ((!strcmp(argv[i], "-testIO")) ||
(!strcmp(argv[i], "--testIO"))) {
lint->testIO = 1;
#ifdef LIBXML_XINCLUDE_ENABLED
} else if ((!strcmp(argv[i], "-xinclude")) ||
(!strcmp(argv[i], "--xinclude"))) {
lint->xinclude = 1;
lint->options |= XML_PARSE_XINCLUDE;
} else if ((!strcmp(argv[i], "-noxincludenode")) ||
(!strcmp(argv[i], "--noxincludenode"))) {
lint->xinclude = 1;
lint->options |= XML_PARSE_XINCLUDE;
lint->options |= XML_PARSE_NOXINCNODE;
} else if ((!strcmp(argv[i], "-nofixup-base-uris")) ||
(!strcmp(argv[i], "--nofixup-base-uris"))) {
lint->xinclude = 1;
lint->options |= XML_PARSE_XINCLUDE;
lint->options |= XML_PARSE_NOBASEFIX;
#endif
} else if ((!strcmp(argv[i], "-nowarning")) ||
(!strcmp(argv[i], "--nowarning"))) {
lint->options |= XML_PARSE_NOWARNING;
lint->options &= ~XML_PARSE_PEDANTIC;
} else if ((!strcmp(argv[i], "-pedantic")) ||
(!strcmp(argv[i], "--pedantic"))) {
lint->options |= XML_PARSE_PEDANTIC;
lint->options &= ~XML_PARSE_NOWARNING;
2000-09-22 16:07:02 +00:00
#ifdef LIBXML_DEBUG_ENABLED
} else if ((!strcmp(argv[i], "-debugent")) ||
(!strcmp(argv[i], "--debugent"))) {
lint->debugent = 1;
#endif
#ifdef LIBXML_C14N_ENABLED
} else if ((!strcmp(argv[i], "-c14n")) ||
(!strcmp(argv[i], "--c14n"))) {
lint->canonical = 1;
lint->options |= XML_PARSE_NOENT | XML_PARSE_DTDATTR | XML_PARSE_DTDLOAD;
} else if ((!strcmp(argv[i], "-c14n11")) ||
(!strcmp(argv[i], "--c14n11"))) {
lint->canonical_11 = 1;
lint->options |= XML_PARSE_NOENT | XML_PARSE_DTDATTR | XML_PARSE_DTDLOAD;
} else if ((!strcmp(argv[i], "-exc-c14n")) ||
(!strcmp(argv[i], "--exc-c14n"))) {
lint->exc_canonical = 1;
lint->options |= XML_PARSE_NOENT | XML_PARSE_DTDATTR | XML_PARSE_DTDLOAD;
#endif
#ifdef LIBXML_CATALOG_ENABLED
} else if ((!strcmp(argv[i], "-catalogs")) ||
(!strcmp(argv[i], "--catalogs"))) {
lint->catalogs = 1;
} else if ((!strcmp(argv[i], "-nocatalogs")) ||
(!strcmp(argv[i], "--nocatalogs"))) {
lint->nocatalogs = 1;
#endif
} else if ((!strcmp(argv[i], "-noblanks")) ||
(!strcmp(argv[i], "--noblanks"))) {
lint->options |= XML_PARSE_NOBLANKS;
#ifdef LIBXML_OUTPUT_ENABLED
} else if ((!strcmp(argv[i], "-o")) ||
(!strcmp(argv[i], "-output")) ||
(!strcmp(argv[i], "--output"))) {
i++;
lint->output = argv[i];
} else if ((!strcmp(argv[i], "-format")) ||
(!strcmp(argv[i], "--format"))) {
lint->format = 1;
lint->options |= XML_PARSE_NOBLANKS;
} else if ((!strcmp(argv[i], "-encode")) ||
(!strcmp(argv[i], "--encode"))) {
i++;
lint->encoding = argv[i];
} else if ((!strcmp(argv[i], "-pretty")) ||
(!strcmp(argv[i], "--pretty"))) {
i++;
if (argv[i] != NULL)
lint->format = atoi(argv[i]);
#ifdef LIBXML_ZLIB_ENABLED
} else if ((!strcmp(argv[i], "-compress")) ||
(!strcmp(argv[i], "--compress"))) {
lint->compress = 1;
#endif
#endif /* LIBXML_OUTPUT_ENABLED */
#ifdef LIBXML_READER_ENABLED
} else if ((!strcmp(argv[i], "-stream")) ||
(!strcmp(argv[i], "--stream"))) {
lint->stream = 1;
} else if ((!strcmp(argv[i], "-walker")) ||
(!strcmp(argv[i], "--walker"))) {
lint->walker = 1;
lint->noout = 1;
#ifdef LIBXML_PATTERN_ENABLED
} else if ((!strcmp(argv[i], "-pattern")) ||
(!strcmp(argv[i], "--pattern"))) {
i++;
lint->pattern = argv[i];
#endif
#endif /* LIBXML_READER_ENABLED */
#ifdef LIBXML_SAX1_ENABLED
} else if ((!strcmp(argv[i], "-sax1")) ||
(!strcmp(argv[i], "--sax1"))) {
lint->options |= XML_PARSE_SAX1;
#endif /* LIBXML_SAX1_ENABLED */
} else if ((!strcmp(argv[i], "-sax")) ||
(!strcmp(argv[i], "--sax"))) {
lint->sax = 1;
#ifdef LIBXML_RELAXNG_ENABLED
} else if ((!strcmp(argv[i], "-relaxng")) ||
(!strcmp(argv[i], "--relaxng"))) {
i++;
lint->relaxng = argv[i];
lint->options |= XML_PARSE_NOENT;
#endif
#ifdef LIBXML_SCHEMAS_ENABLED
} else if ((!strcmp(argv[i], "-schema")) ||
(!strcmp(argv[i], "--schema"))) {
i++;
lint->schema = argv[i];
lint->options |= XML_PARSE_NOENT;
#endif
#ifdef LIBXML_SCHEMATRON_ENABLED
} else if ((!strcmp(argv[i], "-schematron")) ||
(!strcmp(argv[i], "--schematron"))) {
i++;
lint->schematron = argv[i];
lint->options |= XML_PARSE_NOENT;
#endif
} else if ((!strcmp(argv[i], "-nonet")) ||
(!strcmp(argv[i], "--nonet"))) {
lint->options |= XML_PARSE_NONET;
} else if ((!strcmp(argv[i], "-nocompact")) ||
(!strcmp(argv[i], "--nocompact"))) {
lint->options &= ~XML_PARSE_COMPACT;
} else if ((!strcmp(argv[i], "-load-trace")) ||
(!strcmp(argv[i], "--load-trace"))) {
lint->load_trace = 1;
} else if ((!strcmp(argv[i], "-path")) ||
(!strcmp(argv[i], "--path"))) {
i++;
parsePath(lint, BAD_CAST argv[i]);
#ifdef LIBXML_XPATH_ENABLED
} else if ((!strcmp(argv[i], "-xpath")) ||
(!strcmp(argv[i], "--xpath"))) {
i++;
lint->noout++;
lint->xpathquery = argv[i];
#endif
} else if ((!strcmp(argv[i], "-oldxml10")) ||
(!strcmp(argv[i], "--oldxml10"))) {
lint->options |= XML_PARSE_OLD10;
} else if ((!strcmp(argv[i], "-max-ampl")) ||
(!strcmp(argv[i], "--max-ampl"))) {
i++;
if (i >= argc) {
fprintf(errStream, "max-ampl: missing integer value\n");
return(XMLLINT_ERR_UNCLASS);
}
lint->maxAmpl = parseInteger(errStream, "max-ampl", argv[i],
1, UINT_MAX);
} else {
fprintf(errStream, "Unknown option %s\n", argv[i]);
usage(errStream, argv[0]);
return(XMLLINT_ERR_UNCLASS);
}
}
if (lint->shell)
lint->repeat = 1;
return(XMLLINT_RETURN_OK);
}
int
xmllintMain(int argc, const char **argv, FILE *errStream,
xmlResourceLoader loader) {
xmllintState state, *lint;
int i, j, res;
int files = 0;
#ifdef _WIN32
_setmode(_fileno(stdin), _O_BINARY);
_setmode(_fileno(stdout), _O_BINARY);
_setmode(_fileno(stderr), _O_BINARY);
#endif
lint = &state;
xmllintInit(lint);
lint->errStream = errStream;
lint->defaultResourceLoader = loader;
res = xmllintParseOptions(lint, argc, argv);
if (res != XMLLINT_RETURN_OK) {
lint->progresult = res;
goto error;
}
if (lint->maxmem != 0) {
xmllintMaxmem = 0;
xmllintMaxmemReached = 0;
xmllintOom = 0;
xmlMemSetup(myFreeFunc, myMallocFunc, myReallocFunc, myStrdupFunc);
}
LIBXML_TEST_VERSION
#ifdef LIBXML_CATALOG_ENABLED
if (lint->nocatalogs == 0) {
if (lint->catalogs) {
const char *catal;
catal = getenv("SGML_CATALOG_FILES");
if (catal != NULL) {
xmlLoadCatalogs(catal);
} else {
fprintf(errStream, "Variable $SGML_CATALOG_FILES not set\n");
}
}
}
#endif
#ifdef LIBXML_OUTPUT_ENABLED
{
const char *indent = getenv("XMLLINT_INDENT");
if (indent != NULL) {
xmlTreeIndentString = indent;
}
}
#endif
if (lint->htmlout) {
lint->htmlBuf = xmlMalloc(HTML_BUF_SIZE);
if (lint->htmlBuf == NULL) {
lint->progresult = XMLLINT_ERR_MEM;
goto error;
}
if (!lint->nowrap) {
fprintf(errStream,
"<!DOCTYPE HTML PUBLIC \"-//W3C//DTD HTML 4.0 Transitional//EN\"\n");
fprintf(errStream,
"\t\"http://www.w3.org/TR/REC-html40/loose.dtd\">\n");
fprintf(errStream,
"<html><head><title>%s output</title></head>\n",
argv[0]);
fprintf(errStream,
"<body bgcolor=\"#ffffff\"><h1 align=\"center\">%s output</h1>\n",
argv[0]);
}
}
#ifdef LIBXML_SCHEMATRON_ENABLED
if ((lint->schematron != NULL) && (lint->sax == 0)
#ifdef LIBXML_READER_ENABLED
&& (lint->stream == 0)
#endif /* LIBXML_READER_ENABLED */
) {
xmlSchematronParserCtxtPtr ctxt;
/* forces loading the DTDs */
lint->options |= XML_PARSE_DTDLOAD;
if (lint->timing) {
startTimer(lint);
}
ctxt = xmlSchematronNewParserCtxt(lint->schematron);
if (ctxt == NULL) {
lint->progresult = XMLLINT_ERR_MEM;
goto error;
}
lint->wxschematron = xmlSchematronParse(ctxt);
if (lint->wxschematron == NULL) {
fprintf(errStream, "Schematron schema %s failed to compile\n",
lint->schematron);
lint->progresult = XMLLINT_ERR_SCHEMACOMP;
goto error;
}
xmlSchematronFreeParserCtxt(ctxt);
if (lint->timing) {
endTimer(lint, "Compiling the schemas");
}
}
#endif
#ifdef LIBXML_RELAXNG_ENABLED
if ((lint->relaxng != NULL) && (lint->sax == 0)
#ifdef LIBXML_READER_ENABLED
&& (lint->stream == 0)
#endif /* LIBXML_READER_ENABLED */
) {
xmlRelaxNGParserCtxtPtr ctxt;
/* forces loading the DTDs */
lint->options |= XML_PARSE_DTDLOAD;
if (lint->timing) {
startTimer(lint);
}
ctxt = xmlRelaxNGNewParserCtxt(lint->relaxng);
if (ctxt == NULL) {
lint->progresult = XMLLINT_ERR_MEM;
goto error;
}
xmlRelaxNGSetResourceLoader(ctxt, xmllintResourceLoader, lint);
lint->relaxngschemas = xmlRelaxNGParse(ctxt);
if (lint->relaxngschemas == NULL) {
fprintf(errStream, "Relax-NG schema %s failed to compile\n",
lint->relaxng);
lint->progresult = XMLLINT_ERR_SCHEMACOMP;
goto error;
}
xmlRelaxNGFreeParserCtxt(ctxt);
if (lint->timing) {
endTimer(lint, "Compiling the schemas");
}
}
#endif /* LIBXML_RELAXNG_ENABLED */
#ifdef LIBXML_SCHEMAS_ENABLED
if ((lint->schema != NULL)
#ifdef LIBXML_READER_ENABLED
&& (lint->stream == 0)
#endif
) {
xmlSchemaParserCtxtPtr ctxt;
if (lint->timing) {
startTimer(lint);
}
ctxt = xmlSchemaNewParserCtxt(lint->schema);
if (ctxt == NULL) {
lint->progresult = XMLLINT_ERR_MEM;
goto error;
}
xmlSchemaSetResourceLoader(ctxt, xmllintResourceLoader, lint);
lint->wxschemas = xmlSchemaParse(ctxt);
if (lint->wxschemas == NULL) {
fprintf(errStream, "WXS schema %s failed to compile\n",
lint->schema);
lint->progresult = XMLLINT_ERR_SCHEMACOMP;
goto error;
}
xmlSchemaFreeParserCtxt(ctxt);
if (lint->timing) {
endTimer(lint, "Compiling the schemas");
}
}
#endif /* LIBXML_SCHEMAS_ENABLED */
#if defined(LIBXML_READER_ENABLED) && defined(LIBXML_PATTERN_ENABLED)
if ((lint->pattern != NULL) && (lint->walker == 0)) {
res = xmlPatternCompileSafe(BAD_CAST lint->pattern, NULL, 0, NULL,
&lint->patternc);
if (lint->patternc == NULL) {
if (res < 0) {
lint->progresult = XMLLINT_ERR_MEM;
} else {
fprintf(errStream, "Pattern %s failed to compile\n",
lint->pattern);
lint->progresult = XMLLINT_ERR_SCHEMAPAT;
}
goto error;
}
}
#endif /* LIBXML_READER_ENABLED && LIBXML_PATTERN_ENABLED */
/*
* The main loop over input documents
*/
for (i = 1; i < argc ; i++) {
const char *filename = argv[i];
#if HAVE_DECL_MMAP
int memoryFd = -1;
#endif
if ((filename[0] == '-') && (strcmp(filename, "-") != 0)) {
i += skipArgs(filename);
continue;
}
#if HAVE_DECL_MMAP
if (lint->memory) {
struct stat info;
if (stat(filename, &info) < 0) {
lint->progresult = XMLLINT_ERR_RDFILE;
break;
}
memoryFd = open(filename, O_RDONLY);
if (memoryFd < 0) {
lint->progresult = XMLLINT_ERR_RDFILE;
break;
}
lint->memoryData = mmap(NULL, info.st_size, PROT_READ,
MAP_SHARED, memoryFd, 0);
if (lint->memoryData == (void *) MAP_FAILED) {
close(memoryFd);
fprintf(errStream, "mmap failure for file %s\n", filename);
lint->progresult = XMLLINT_ERR_RDFILE;
break;
}
lint->memorySize = info.st_size;
}
#endif /* HAVE_DECL_MMAP */
if ((lint->timing) && (lint->repeat > 1))
startTimer(lint);
#ifdef LIBXML_READER_ENABLED
if (lint->stream != 0) {
for (j = 0; j < lint->repeat; j++)
streamFile(lint, filename);
} else
#endif /* LIBXML_READER_ENABLED */
{
xmlParserCtxtPtr ctxt;
#ifdef LIBXML_HTML_ENABLED
if (lint->html) {
#ifdef LIBXML_PUSH_ENABLED
if (lint->push) {
ctxt = htmlCreatePushParserCtxt(NULL, NULL, NULL, 0,
filename,
XML_CHAR_ENCODING_NONE);
} else
#endif /* LIBXML_PUSH_ENABLED */
{
ctxt = htmlNewParserCtxt();
}
htmlCtxtUseOptions(ctxt, lint->options);
} else
#endif /* LIBXML_HTML_ENABLED */
{
#ifdef LIBXML_PUSH_ENABLED
if (lint->push) {
ctxt = xmlCreatePushParserCtxt(NULL, NULL, NULL, 0,
filename);
} else
#endif /* LIBXML_PUSH_ENABLED */
{
ctxt = xmlNewParserCtxt();
}
xmlCtxtUseOptions(ctxt, lint->options);
}
if (ctxt == NULL) {
lint->progresult = XMLLINT_ERR_MEM;
goto error;
}
if (lint->sax) {
const xmlSAXHandler *handler;
if (lint->noout) {
handler = &emptySAXHandler;
#ifdef LIBXML_SAX1_ENABLED
} else if (lint->options & XML_PARSE_SAX1) {
handler = &debugSAXHandler;
#endif
} else {
handler = &debugSAX2Handler;
}
*ctxt->sax = *handler;
ctxt->userData = lint;
}
xmlCtxtSetResourceLoader(ctxt, xmllintResourceLoader, lint);
if (lint->maxAmpl > 0)
xmlCtxtSetMaxAmplification(ctxt, lint->maxAmpl);
if (lint->htmlout) {
ctxt->_private = lint;
xmlCtxtSetErrorHandler(ctxt, xmlHTMLError, ctxt);
}
lint->ctxt = ctxt;
for (j = 0; j < lint->repeat; j++) {
#ifdef LIBXML_PUSH_ENABLED
if ((lint->push) && (j > 0))
xmlCtxtResetPush(ctxt, NULL, 0, NULL, NULL);
#endif
if (lint->sax) {
testSAX(lint, filename);
} else {
parseAndPrintFile(lint, filename);
}
}
xmlFreeParserCtxt(ctxt);
}
if ((lint->timing) && (lint->repeat > 1)) {
endTimer(lint, "%d iterations", lint->repeat);
}
files += 1;
#if HAVE_DECL_MMAP
if (lint->memory) {
munmap(lint->memoryData, lint->memorySize);
close(memoryFd);
}
#endif
}
if (lint->generate)
parseAndPrintFile(lint, NULL);
if ((lint->htmlout) && (!lint->nowrap)) {
fprintf(errStream, "</body></html>\n");
}
if ((files == 0) && (!lint->generate) && (lint->version == 0)) {
usage(errStream, argv[0]);
lint->progresult = XMLLINT_ERR_UNCLASS;
}
2025-01-17 13:04:35 +01:00
error:
if (lint->htmlout)
xmlFree(lint->htmlBuf);
#ifdef LIBXML_SCHEMATRON_ENABLED
if (lint->wxschematron != NULL)
xmlSchematronFree(lint->wxschematron);
#endif
#ifdef LIBXML_RELAXNG_ENABLED
if (lint->relaxngschemas != NULL)
xmlRelaxNGFree(lint->relaxngschemas);
#endif
#ifdef LIBXML_SCHEMAS_ENABLED
if (lint->wxschemas != NULL)
xmlSchemaFree(lint->wxschemas);
#endif
#if defined(LIBXML_READER_ENABLED) && defined(LIBXML_PATTERN_ENABLED)
if (lint->patternc != NULL)
xmlFreePattern(lint->patternc);
#endif
xmlCleanupParser();
if ((lint->maxmem) && (xmllintMaxmemReached)) {
fprintf(errStream, "Maximum memory exceeded (%d bytes)\n",
xmllintMaxmem);
} else if (lint->progresult == XMLLINT_ERR_MEM) {
fprintf(errStream, "Out-of-memory error reported\n");
}
#ifdef FUZZING_BUILD_MODE_UNSAFE_FOR_PRODUCTION
if ((lint->maxmem) &&
(xmllintOom != (lint->progresult == XMLLINT_ERR_MEM))) {
fprintf(stderr, "xmllint: malloc failure %s reported\n",
xmllintOom ? "not" : "erroneously");
abort();
}
#endif
return(lint->progresult);
}