mirror of
https://gitlab.gnome.org/GNOME/libxml2
synced 2025-03-28 21:33:13 +00:00
Add XPath and XPointer fuzzer
This commit is contained in:
parent
956534e02e
commit
ad26a60f95
5
fuzz/.gitignore
vendored
5
fuzz/.gitignore
vendored
@ -5,9 +5,12 @@ regexp
|
||||
schema
|
||||
schemaSeed
|
||||
seed/html*
|
||||
seed/xml*
|
||||
seed/schema*
|
||||
seed/xml*
|
||||
seed/xpath*
|
||||
testFuzzer
|
||||
uri
|
||||
xml
|
||||
xmlSeed
|
||||
xpath
|
||||
xpathSeed
|
||||
|
@ -1,4 +1,5 @@
|
||||
EXTRA_PROGRAMS = html htmlSeed regexp uri schema schemaSeed xml xmlSeed
|
||||
EXTRA_PROGRAMS = html htmlSeed regexp uri schema schemaSeed xml xmlSeed \
|
||||
xpath xpathSeed
|
||||
check_PROGRAMS = testFuzzer
|
||||
CLEANFILES = $(EXTRA_PROGRAMS)
|
||||
AM_CPPFLAGS = -I$(top_srcdir)/include
|
||||
@ -133,3 +134,23 @@ fuzz-schema: schema$(EXEEXT) seed/schema.stamp
|
||||
-timeout=20 \
|
||||
corpus/schema seed/schema
|
||||
|
||||
# XPath fuzzer
|
||||
|
||||
xpathSeed_SOURCES = xpathSeed.c fuzz.c
|
||||
|
||||
seed/xpath.stamp: xpathSeed$(EXEEXT)
|
||||
@mkdir -p seed/xpath
|
||||
@./xpathSeed$(EXEEXT) "$(top_builddir)/test/XPath"
|
||||
@touch seed/xpath.stamp
|
||||
|
||||
xpath_SOURCES = xpath.c fuzz.c
|
||||
xpath_LDFLAGS = -fsanitize=fuzzer
|
||||
|
||||
fuzz-xpath: xpath$(EXEEXT) seed/xpath.stamp
|
||||
@mkdir -p corpus/xpath
|
||||
./xpath$(EXEEXT) \
|
||||
-dict=xpath.dict \
|
||||
-max_len=10000 \
|
||||
-timeout=20 \
|
||||
corpus/xpath seed/xpath
|
||||
|
||||
|
24
fuzz/fuzz.c
24
fuzz/fuzz.c
@ -122,20 +122,24 @@ xmlFuzzReadRemaining(size_t *size) {
|
||||
}
|
||||
|
||||
/*
|
||||
* Write a random-length string to stdout in a format similar to
|
||||
* xmlFuzzWriteString:
|
||||
* @out: output file
|
||||
* @str: string to write
|
||||
*
|
||||
* Write a random-length string to file in a format similar to
|
||||
* FuzzedDataProvider. Backslash followed by newline marks the end of the
|
||||
* string. Two backslashes are used to escape a backslash.
|
||||
*/
|
||||
static void
|
||||
xmlFuzzWriteString(const char *str) {
|
||||
void
|
||||
xmlFuzzWriteString(FILE *out, const char *str) {
|
||||
for (; *str; str++) {
|
||||
int c = (unsigned char) *str;
|
||||
putchar(c);
|
||||
putc(c, out);
|
||||
if (c == '\\')
|
||||
putchar(c);
|
||||
putc(c, out);
|
||||
}
|
||||
putchar('\\');
|
||||
putchar('\n');
|
||||
putc('\\', out);
|
||||
putc('\n', out);
|
||||
}
|
||||
|
||||
/**
|
||||
@ -150,7 +154,7 @@ xmlFuzzWriteString(const char *str) {
|
||||
*
|
||||
* Returns a zero-terminated string or NULL if the fuzz data is exhausted.
|
||||
*/
|
||||
static const char *
|
||||
const char *
|
||||
xmlFuzzReadString(size_t *size) {
|
||||
const char *out = fuzzData.outPtr;
|
||||
|
||||
@ -217,8 +221,8 @@ xmlFuzzEntityRecorder(const char *URL, const char *ID,
|
||||
}
|
||||
} while (len > 0);
|
||||
|
||||
xmlFuzzWriteString(URL);
|
||||
xmlFuzzWriteString((char *) xmlBufContent(in->buf->buffer));
|
||||
xmlFuzzWriteString(stdout, URL);
|
||||
xmlFuzzWriteString(stdout, (char *) xmlBufContent(in->buf->buffer));
|
||||
|
||||
xmlFreeInputStream(in);
|
||||
|
||||
|
@ -36,6 +36,12 @@ xmlFuzzReadInt(void);
|
||||
const char *
|
||||
xmlFuzzReadRemaining(size_t *size);
|
||||
|
||||
void
|
||||
xmlFuzzWriteString(FILE *out, const char *str);
|
||||
|
||||
const char *
|
||||
xmlFuzzReadString(size_t *size);
|
||||
|
||||
xmlParserInputPtr
|
||||
xmlFuzzEntityRecorder(const char *URL, const char *ID, xmlParserCtxtPtr ctxt);
|
||||
|
||||
|
49
fuzz/xpath.c
Normal file
49
fuzz/xpath.c
Normal file
@ -0,0 +1,49 @@
|
||||
/*
|
||||
* xpath.c: a libFuzzer target to test XPath and XPointer expressions.
|
||||
*
|
||||
* See Copyright for the status of this software.
|
||||
*/
|
||||
|
||||
#include <libxml/parser.h>
|
||||
#include <libxml/xpointer.h>
|
||||
#include "fuzz.h"
|
||||
|
||||
int
|
||||
LLVMFuzzerInitialize(int *argc ATTRIBUTE_UNUSED,
|
||||
char ***argv ATTRIBUTE_UNUSED) {
|
||||
xmlInitParser();
|
||||
xmlSetGenericErrorFunc(NULL, xmlFuzzErrorFunc);
|
||||
|
||||
return 0;
|
||||
}
|
||||
|
||||
int
|
||||
LLVMFuzzerTestOneInput(const char *data, size_t size) {
|
||||
xmlDocPtr doc;
|
||||
const char *expr, *xml;
|
||||
size_t exprSize, xmlSize;
|
||||
|
||||
xmlFuzzDataInit(data, size);
|
||||
|
||||
expr = xmlFuzzReadString(&exprSize);
|
||||
xml = xmlFuzzReadString(&xmlSize);
|
||||
|
||||
doc = xmlParseMemory(xml, xmlSize);
|
||||
if (doc != NULL) {
|
||||
xmlXPathContextPtr xpctxt = xmlXPathNewContext(doc);
|
||||
|
||||
/* Resource limits to avoid timeouts and call stack overflows */
|
||||
xpctxt->maxParserDepth = 15;
|
||||
xpctxt->maxDepth = 100;
|
||||
xpctxt->opLimit = 500000;
|
||||
|
||||
xmlXPathFreeObject(xmlXPtrEval(BAD_CAST expr, xpctxt));
|
||||
xmlXPathFreeContext(xpctxt);
|
||||
}
|
||||
xmlFreeDoc(doc);
|
||||
|
||||
xmlFuzzDataCleanup();
|
||||
|
||||
return(0);
|
||||
}
|
||||
|
94
fuzz/xpath.dict
Normal file
94
fuzz/xpath.dict
Normal file
@ -0,0 +1,94 @@
|
||||
# XML
|
||||
|
||||
elem_a="<a></a>"
|
||||
elem_b="<b></b>"
|
||||
elem_c="<c></c>"
|
||||
elem_d="<d></d>"
|
||||
elem_empty="<a/>"
|
||||
elem_ns_a="<a:a xmlns:a='a'></a:a>"
|
||||
elem_ns_b="<b:b xmlns:b='b'></b:b>"
|
||||
|
||||
attr_a=" a='a'"
|
||||
attr_b=" b='b'"
|
||||
|
||||
ns_decl=" xmlns:a='a'"
|
||||
ns_default=" xmlns='a'"
|
||||
ns_prefix_a="a:"
|
||||
ns_prefix_b="b:"
|
||||
|
||||
cdata_section="<![CDATA[ ]]>"
|
||||
|
||||
comment="<!-- -->"
|
||||
|
||||
pi="<?a?>"
|
||||
|
||||
# XPath
|
||||
|
||||
axis_ancestor="ancestor::"
|
||||
axis_ancestor_or_self="ancestor-or-self::"
|
||||
axis_attribute="attribute::"
|
||||
axis_attribute_abbrev="@"
|
||||
axis_child="child::"
|
||||
axis_descendant="descendant::"
|
||||
axis_descendant_or_self="descendant-or-self::"
|
||||
axis_following="following::"
|
||||
axis_following_sibling="following-sibling::"
|
||||
axis_namespace="namespace::"
|
||||
axis_parent="parent::"
|
||||
axis_preceding="preceding::"
|
||||
axis_preceding_siblings="preceding-sibling::"
|
||||
axis_self="self::"
|
||||
|
||||
node_test_ns="a:"
|
||||
|
||||
val_num="=(1.0)"
|
||||
val_str_sq="=('a')"
|
||||
val_str_dq="=(\"a\")"
|
||||
val_node_set="=(*)"
|
||||
val_elem="=(b)"
|
||||
|
||||
step_root="/"
|
||||
step_descendant="//"
|
||||
step_any="//*"
|
||||
step_any_l="*//"
|
||||
step_elem="//b"
|
||||
step_ns_elem="//a:a"
|
||||
step_comment="//comment()"
|
||||
step_node="//node()"
|
||||
step_node_l="node()//"
|
||||
step_pi="//processing-instruction()"
|
||||
step_text="//text()"
|
||||
step_parent="../"
|
||||
|
||||
op_plus="+1"
|
||||
op_minus=" - 1"
|
||||
op_neg="-"
|
||||
op_mul="*1"
|
||||
op_div=" div 1"
|
||||
op_mod=" mod 1"
|
||||
op_and=" and 1"
|
||||
op_or=" or 1"
|
||||
op_ne="!=1"
|
||||
op_lt="<1"
|
||||
op_gt=">1"
|
||||
op_le="<=1"
|
||||
op_ge=">=1"
|
||||
op_predicate_num="[1]"
|
||||
op_predicate_last="[last()]"
|
||||
op_predicate_str="['a']"
|
||||
op_predicate="[1=1]"
|
||||
op_arg_num=",1"
|
||||
op_arg_str=",'a'"
|
||||
op_arg_node=",*"
|
||||
op_union="|//b"
|
||||
|
||||
var_num="=$f"
|
||||
var_bool="=$b"
|
||||
var_str="=$s"
|
||||
var_node_set="=$n"
|
||||
|
||||
# Unicode
|
||||
|
||||
utf8_2="\xC3\x84"
|
||||
utf8_3="\xE2\x80\x9C"
|
||||
utf8_4="\xF0\x9F\x98\x80"
|
3
fuzz/xpath.options
Normal file
3
fuzz/xpath.options
Normal file
@ -0,0 +1,3 @@
|
||||
[libfuzzer]
|
||||
max_len = 10000
|
||||
timeout = 20
|
171
fuzz/xpathSeed.c
Normal file
171
fuzz/xpathSeed.c
Normal file
@ -0,0 +1,171 @@
|
||||
/*
|
||||
* xpathSeed.c: Generate the XPath and XPointer seed corpus for fuzzing.
|
||||
*
|
||||
* See Copyright for the status of this software.
|
||||
*/
|
||||
|
||||
#include <glob.h>
|
||||
#include <libgen.h>
|
||||
#include <stdio.h>
|
||||
#include <sys/stat.h>
|
||||
#include "fuzz.h"
|
||||
|
||||
#define PATH_SIZE 256
|
||||
#define EXPR_SIZE 4500
|
||||
|
||||
typedef struct {
|
||||
const char *name;
|
||||
const char *prefix;
|
||||
char *data;
|
||||
int counter;
|
||||
} xpathTestXml;
|
||||
|
||||
static int
|
||||
processXml(const char *testDir, xpathTestXml *xml, const char *subdir,
|
||||
int xptr);
|
||||
|
||||
int
|
||||
main(int argc, char **argv) {
|
||||
xpathTestXml xml;
|
||||
char pattern[PATH_SIZE];
|
||||
glob_t globbuf;
|
||||
size_t i, size;
|
||||
int ret = 0;
|
||||
|
||||
if (argc != 2) {
|
||||
fprintf(stderr, "Usage: xpathSeed [TESTDIR]\n");
|
||||
return(1);
|
||||
}
|
||||
|
||||
xml.name = "expr";
|
||||
xml.prefix = "";
|
||||
xml.data = "<d></d>";
|
||||
xml.counter = 1;
|
||||
if (processXml(argv[1], &xml, "expr", 0) != 0)
|
||||
ret = 1;
|
||||
|
||||
size = snprintf(pattern, sizeof(pattern), "%s/docs/*", argv[1]);
|
||||
if (size >= PATH_SIZE)
|
||||
return(1);
|
||||
if (glob(pattern, 0, NULL, &globbuf) != 0)
|
||||
return(1);
|
||||
|
||||
for (i = 0; i < globbuf.gl_pathc; i++) {
|
||||
char *path = globbuf.gl_pathv[i];
|
||||
FILE *xmlFile;
|
||||
struct stat statbuf;
|
||||
|
||||
if ((stat(path, &statbuf) != 0) || (!S_ISREG(statbuf.st_mode)))
|
||||
continue;
|
||||
size = statbuf.st_size;
|
||||
xmlFile = fopen(path, "rb");
|
||||
if (xmlFile == NULL) {
|
||||
ret = 1;
|
||||
continue;
|
||||
}
|
||||
xml.data = xmlMalloc(size + 1);
|
||||
if (xml.data == NULL) {
|
||||
ret = 1;
|
||||
goto close;
|
||||
}
|
||||
if (fread(xml.data, 1, size, xmlFile) != size) {
|
||||
ret = 1;
|
||||
goto free;
|
||||
}
|
||||
xml.data[size] = 0;
|
||||
xml.name = basename(path);
|
||||
xml.prefix = xml.name;
|
||||
xml.counter = 1;
|
||||
|
||||
if (processXml(argv[1], &xml, "tests", 0) != 0)
|
||||
ret = 1;
|
||||
if (processXml(argv[1], &xml, "xptr", 1) != 0)
|
||||
ret = 1;
|
||||
|
||||
free:
|
||||
xmlFree(xml.data);
|
||||
close:
|
||||
fclose(xmlFile);
|
||||
}
|
||||
|
||||
globfree(&globbuf);
|
||||
|
||||
return(ret);
|
||||
}
|
||||
|
||||
static int
|
||||
processXml(const char *testDir, xpathTestXml *xml, const char *subdir,
|
||||
int xptr) {
|
||||
char pattern[PATH_SIZE];
|
||||
glob_t globbuf;
|
||||
size_t i, size;
|
||||
int ret = 0;
|
||||
|
||||
size = snprintf(pattern, sizeof(pattern), "%s/%s/%s*",
|
||||
testDir, subdir, xml->prefix);
|
||||
if (size >= PATH_SIZE)
|
||||
return(-1);
|
||||
if (glob(pattern, 0, NULL, &globbuf) != 0)
|
||||
return(-1);
|
||||
|
||||
for (i = 0; i < globbuf.gl_pathc; i++) {
|
||||
char *path = globbuf.gl_pathv[i];
|
||||
struct stat statbuf;
|
||||
FILE *in;
|
||||
char expr[EXPR_SIZE];
|
||||
|
||||
if ((stat(path, &statbuf) != 0) || (!S_ISREG(statbuf.st_mode)))
|
||||
continue;
|
||||
|
||||
printf("## Processing %s\n", path);
|
||||
in = fopen(path, "rb");
|
||||
if (in == NULL) {
|
||||
ret = -1;
|
||||
continue;
|
||||
}
|
||||
|
||||
while (fgets(expr, EXPR_SIZE, in) > 0) {
|
||||
char outPath[PATH_SIZE];
|
||||
FILE *out;
|
||||
int j;
|
||||
|
||||
for (j = 0; expr[j] != 0; j++)
|
||||
if (expr[j] == '\r' || expr[j] == '\n')
|
||||
break;
|
||||
expr[j] = 0;
|
||||
|
||||
size = snprintf(outPath, sizeof(outPath), "seed/xpath/%s-%d",
|
||||
xml->name, xml->counter);
|
||||
if (size >= PATH_SIZE) {
|
||||
ret = -1;
|
||||
continue;
|
||||
}
|
||||
out = fopen(outPath, "wb");
|
||||
if (out == NULL) {
|
||||
ret = -1;
|
||||
continue;
|
||||
}
|
||||
|
||||
if (xptr) {
|
||||
xmlFuzzWriteString(out, expr);
|
||||
} else {
|
||||
char xptrExpr[EXPR_SIZE+100];
|
||||
|
||||
snprintf(xptrExpr, sizeof(xptrExpr), "xpointer(%s)", expr);
|
||||
xmlFuzzWriteString(out, xptrExpr);
|
||||
}
|
||||
|
||||
xmlFuzzWriteString(out, xml->data);
|
||||
|
||||
fclose(out);
|
||||
xml->counter++;
|
||||
}
|
||||
|
||||
fclose(in);
|
||||
}
|
||||
|
||||
globfree(&globbuf);
|
||||
|
||||
return(ret);
|
||||
}
|
||||
|
Loading…
x
Reference in New Issue
Block a user