1516 lines
48 KiB
C
1516 lines
48 KiB
C
|
/* Copyright (c) 1998, 1999, 2000 Thai Open Source Software Center Ltd
|
||
|
See the file COPYING for copying permission.
|
||
|
|
||
|
runtest.c : run the Expat test suite
|
||
|
*/
|
||
|
|
||
|
#ifdef HAVE_EXPAT_CONFIG_H
|
||
|
#include <expat_config.h>
|
||
|
#endif
|
||
|
|
||
|
#include <assert.h>
|
||
|
#include <stdlib.h>
|
||
|
#include <stdio.h>
|
||
|
#include <string.h>
|
||
|
#include <stdint.h>
|
||
|
|
||
|
#include "expat.h"
|
||
|
#include "chardata.h"
|
||
|
#include "minicheck.h"
|
||
|
|
||
|
#if defined(__amigaos__) && defined(__USE_INLINE__)
|
||
|
#include <proto/expat.h>
|
||
|
#endif
|
||
|
|
||
|
#ifdef XML_LARGE_SIZE
|
||
|
#define XML_FMT_INT_MOD "ll"
|
||
|
#else
|
||
|
#define XML_FMT_INT_MOD "l"
|
||
|
#endif
|
||
|
|
||
|
static XML_Parser parser;
|
||
|
|
||
|
|
||
|
static void
|
||
|
basic_setup(void)
|
||
|
{
|
||
|
parser = XML_ParserCreate(NULL);
|
||
|
if (parser == NULL)
|
||
|
fail("Parser not created.");
|
||
|
}
|
||
|
|
||
|
static void
|
||
|
basic_teardown(void)
|
||
|
{
|
||
|
if (parser != NULL)
|
||
|
XML_ParserFree(parser);
|
||
|
}
|
||
|
|
||
|
/* Generate a failure using the parser state to create an error message;
|
||
|
this should be used when the parser reports an error we weren't
|
||
|
expecting.
|
||
|
*/
|
||
|
static void
|
||
|
_xml_failure(XML_Parser parser, const char *file, int line)
|
||
|
{
|
||
|
char buffer[1024];
|
||
|
enum XML_Error err = XML_GetErrorCode(parser);
|
||
|
sprintf(buffer,
|
||
|
" %d: %s (line %" XML_FMT_INT_MOD "u, offset %"\
|
||
|
XML_FMT_INT_MOD "u)\n reported from %s, line %d\n",
|
||
|
err,
|
||
|
XML_ErrorString(err),
|
||
|
XML_GetCurrentLineNumber(parser),
|
||
|
XML_GetCurrentColumnNumber(parser),
|
||
|
file, line);
|
||
|
_fail_unless(0, file, line, buffer);
|
||
|
}
|
||
|
|
||
|
#define xml_failure(parser) _xml_failure((parser), __FILE__, __LINE__)
|
||
|
|
||
|
static void
|
||
|
_expect_failure(char *text, enum XML_Error errorCode, char *errorMessage,
|
||
|
char *file, int lineno)
|
||
|
{
|
||
|
if (XML_Parse(parser, text, strlen(text), XML_TRUE) == XML_STATUS_OK)
|
||
|
/* Hackish use of _fail_unless() macro, but let's us report
|
||
|
the right filename and line number. */
|
||
|
_fail_unless(0, file, lineno, errorMessage);
|
||
|
if (XML_GetErrorCode(parser) != errorCode)
|
||
|
_xml_failure(parser, file, lineno);
|
||
|
}
|
||
|
|
||
|
#define expect_failure(text, errorCode, errorMessage) \
|
||
|
_expect_failure((text), (errorCode), (errorMessage), \
|
||
|
__FILE__, __LINE__)
|
||
|
|
||
|
/* Dummy handlers for when we need to set a handler to tickle a bug,
|
||
|
but it doesn't need to do anything.
|
||
|
*/
|
||
|
|
||
|
static void XMLCALL
|
||
|
dummy_start_doctype_handler(void *userData,
|
||
|
const XML_Char *doctypeName,
|
||
|
const XML_Char *sysid,
|
||
|
const XML_Char *pubid,
|
||
|
int has_internal_subset)
|
||
|
{}
|
||
|
|
||
|
static void XMLCALL
|
||
|
dummy_end_doctype_handler(void *userData)
|
||
|
{}
|
||
|
|
||
|
static void XMLCALL
|
||
|
dummy_entity_decl_handler(void *userData,
|
||
|
const XML_Char *entityName,
|
||
|
int is_parameter_entity,
|
||
|
const XML_Char *value,
|
||
|
int value_length,
|
||
|
const XML_Char *base,
|
||
|
const XML_Char *systemId,
|
||
|
const XML_Char *publicId,
|
||
|
const XML_Char *notationName)
|
||
|
{}
|
||
|
|
||
|
static void XMLCALL
|
||
|
dummy_notation_decl_handler(void *userData,
|
||
|
const XML_Char *notationName,
|
||
|
const XML_Char *base,
|
||
|
const XML_Char *systemId,
|
||
|
const XML_Char *publicId)
|
||
|
{}
|
||
|
|
||
|
static void XMLCALL
|
||
|
dummy_element_decl_handler(void *userData,
|
||
|
const XML_Char *name,
|
||
|
XML_Content *model)
|
||
|
{}
|
||
|
|
||
|
static void XMLCALL
|
||
|
dummy_attlist_decl_handler(void *userData,
|
||
|
const XML_Char *elname,
|
||
|
const XML_Char *attname,
|
||
|
const XML_Char *att_type,
|
||
|
const XML_Char *dflt,
|
||
|
int isrequired)
|
||
|
{}
|
||
|
|
||
|
static void XMLCALL
|
||
|
dummy_comment_handler(void *userData, const XML_Char *data)
|
||
|
{}
|
||
|
|
||
|
static void XMLCALL
|
||
|
dummy_pi_handler(void *userData, const XML_Char *target, const XML_Char *data)
|
||
|
{}
|
||
|
|
||
|
static void XMLCALL
|
||
|
dummy_start_element(void *userData,
|
||
|
const XML_Char *name, const XML_Char **atts)
|
||
|
{}
|
||
|
|
||
|
|
||
|
/*
|
||
|
* Character & encoding tests.
|
||
|
*/
|
||
|
|
||
|
START_TEST(test_nul_byte)
|
||
|
{
|
||
|
char text[] = "<doc>\0</doc>";
|
||
|
|
||
|
/* test that a NUL byte (in US-ASCII data) is an error */
|
||
|
if (XML_Parse(parser, text, sizeof(text) - 1, XML_TRUE) == XML_STATUS_OK)
|
||
|
fail("Parser did not report error on NUL-byte.");
|
||
|
if (XML_GetErrorCode(parser) != XML_ERROR_INVALID_TOKEN)
|
||
|
xml_failure(parser);
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
|
||
|
START_TEST(test_u0000_char)
|
||
|
{
|
||
|
/* test that a NUL byte (in US-ASCII data) is an error */
|
||
|
expect_failure("<doc>�</doc>",
|
||
|
XML_ERROR_BAD_CHAR_REF,
|
||
|
"Parser did not report error on NUL-byte.");
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
START_TEST(test_bom_utf8)
|
||
|
{
|
||
|
/* This test is really just making sure we don't core on a UTF-8 BOM. */
|
||
|
char *text = "\357\273\277<e/>";
|
||
|
|
||
|
if (XML_Parse(parser, text, strlen(text), XML_TRUE) == XML_STATUS_ERROR)
|
||
|
xml_failure(parser);
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
START_TEST(test_bom_utf16_be)
|
||
|
{
|
||
|
char text[] = "\376\377\0<\0e\0/\0>";
|
||
|
|
||
|
if (XML_Parse(parser, text, sizeof(text)-1, XML_TRUE) == XML_STATUS_ERROR)
|
||
|
xml_failure(parser);
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
START_TEST(test_bom_utf16_le)
|
||
|
{
|
||
|
char text[] = "\377\376<\0e\0/\0>\0";
|
||
|
|
||
|
if (XML_Parse(parser, text, sizeof(text)-1, XML_TRUE) == XML_STATUS_ERROR)
|
||
|
xml_failure(parser);
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
static void XMLCALL
|
||
|
accumulate_characters(void *userData, const XML_Char *s, int len)
|
||
|
{
|
||
|
CharData_AppendXMLChars((CharData *)userData, s, len);
|
||
|
}
|
||
|
|
||
|
static void XMLCALL
|
||
|
accumulate_attribute(void *userData, const XML_Char *name,
|
||
|
const XML_Char **atts)
|
||
|
{
|
||
|
CharData *storage = (CharData *)userData;
|
||
|
if (storage->count < 0 && atts != NULL && atts[0] != NULL) {
|
||
|
/* "accumulate" the value of the first attribute we see */
|
||
|
CharData_AppendXMLChars(storage, atts[1], -1);
|
||
|
}
|
||
|
}
|
||
|
|
||
|
|
||
|
static void
|
||
|
_run_character_check(XML_Char *text, XML_Char *expected,
|
||
|
const char *file, int line)
|
||
|
{
|
||
|
CharData storage;
|
||
|
|
||
|
CharData_Init(&storage);
|
||
|
XML_SetUserData(parser, &storage);
|
||
|
XML_SetCharacterDataHandler(parser, accumulate_characters);
|
||
|
if (XML_Parse(parser, text, strlen(text), XML_TRUE) == XML_STATUS_ERROR)
|
||
|
_xml_failure(parser, file, line);
|
||
|
CharData_CheckXMLChars(&storage, expected);
|
||
|
}
|
||
|
|
||
|
#define run_character_check(text, expected) \
|
||
|
_run_character_check(text, expected, __FILE__, __LINE__)
|
||
|
|
||
|
static void
|
||
|
_run_attribute_check(XML_Char *text, XML_Char *expected,
|
||
|
const char *file, int line)
|
||
|
{
|
||
|
CharData storage;
|
||
|
|
||
|
CharData_Init(&storage);
|
||
|
XML_SetUserData(parser, &storage);
|
||
|
XML_SetStartElementHandler(parser, accumulate_attribute);
|
||
|
if (XML_Parse(parser, text, strlen(text), XML_TRUE) == XML_STATUS_ERROR)
|
||
|
_xml_failure(parser, file, line);
|
||
|
CharData_CheckXMLChars(&storage, expected);
|
||
|
}
|
||
|
|
||
|
#define run_attribute_check(text, expected) \
|
||
|
_run_attribute_check(text, expected, __FILE__, __LINE__)
|
||
|
|
||
|
/* Regression test for SF bug #491986. */
|
||
|
START_TEST(test_danish_latin1)
|
||
|
{
|
||
|
char *text =
|
||
|
"<?xml version='1.0' encoding='iso-8859-1'?>\n"
|
||
|
"<e>J\xF8rgen \xE6\xF8\xE5\xC6\xD8\xC5</e>";
|
||
|
run_character_check(text,
|
||
|
"J\xC3\xB8rgen \xC3\xA6\xC3\xB8\xC3\xA5\xC3\x86\xC3\x98\xC3\x85");
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
|
||
|
/* Regression test for SF bug #514281. */
|
||
|
START_TEST(test_french_charref_hexidecimal)
|
||
|
{
|
||
|
char *text =
|
||
|
"<?xml version='1.0' encoding='iso-8859-1'?>\n"
|
||
|
"<doc>éèàçêÈ</doc>";
|
||
|
run_character_check(text,
|
||
|
"\xC3\xA9\xC3\xA8\xC3\xA0\xC3\xA7\xC3\xAA\xC3\x88");
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
START_TEST(test_french_charref_decimal)
|
||
|
{
|
||
|
char *text =
|
||
|
"<?xml version='1.0' encoding='iso-8859-1'?>\n"
|
||
|
"<doc>éèàçêÈ</doc>";
|
||
|
run_character_check(text,
|
||
|
"\xC3\xA9\xC3\xA8\xC3\xA0\xC3\xA7\xC3\xAA\xC3\x88");
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
START_TEST(test_french_latin1)
|
||
|
{
|
||
|
char *text =
|
||
|
"<?xml version='1.0' encoding='iso-8859-1'?>\n"
|
||
|
"<doc>\xE9\xE8\xE0\xE7\xEa\xC8</doc>";
|
||
|
run_character_check(text,
|
||
|
"\xC3\xA9\xC3\xA8\xC3\xA0\xC3\xA7\xC3\xAA\xC3\x88");
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
START_TEST(test_french_utf8)
|
||
|
{
|
||
|
char *text =
|
||
|
"<?xml version='1.0' encoding='utf-8'?>\n"
|
||
|
"<doc>\xC3\xA9</doc>";
|
||
|
run_character_check(text, "\xC3\xA9");
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
/* Regression test for SF bug #600479.
|
||
|
XXX There should be a test that exercises all legal XML Unicode
|
||
|
characters as PCDATA and attribute value content, and XML Name
|
||
|
characters as part of element and attribute names.
|
||
|
*/
|
||
|
START_TEST(test_utf8_false_rejection)
|
||
|
{
|
||
|
char *text = "<doc>\xEF\xBA\xBF</doc>";
|
||
|
run_character_check(text, "\xEF\xBA\xBF");
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
/* Regression test for SF bug #477667.
|
||
|
This test assures that any 8-bit character followed by a 7-bit
|
||
|
character will not be mistakenly interpreted as a valid UTF-8
|
||
|
sequence.
|
||
|
*/
|
||
|
START_TEST(test_illegal_utf8)
|
||
|
{
|
||
|
char text[100];
|
||
|
int i;
|
||
|
|
||
|
for (i = 128; i <= 255; ++i) {
|
||
|
sprintf(text, "<e>%ccd</e>", i);
|
||
|
if (XML_Parse(parser, text, strlen(text), XML_TRUE) == XML_STATUS_OK) {
|
||
|
sprintf(text,
|
||
|
"expected token error for '%c' (ordinal %d) in UTF-8 text",
|
||
|
i, i);
|
||
|
fail(text);
|
||
|
}
|
||
|
else if (XML_GetErrorCode(parser) != XML_ERROR_INVALID_TOKEN)
|
||
|
xml_failure(parser);
|
||
|
/* Reset the parser since we use the same parser repeatedly. */
|
||
|
XML_ParserReset(parser, NULL);
|
||
|
}
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
START_TEST(test_utf16)
|
||
|
{
|
||
|
/* <?xml version="1.0" encoding="UTF-16"?>
|
||
|
<doc a='123'>some text</doc>
|
||
|
*/
|
||
|
char text[] =
|
||
|
"\000<\000?\000x\000m\000\154\000 \000v\000e\000r\000s\000i\000o"
|
||
|
"\000n\000=\000'\0001\000.\000\060\000'\000 \000e\000n\000c\000o"
|
||
|
"\000d\000i\000n\000g\000=\000'\000U\000T\000F\000-\0001\000\066"
|
||
|
"\000'\000?\000>\000\n"
|
||
|
"\000<\000d\000o\000c\000 \000a\000=\000'\0001\0002\0003\000'"
|
||
|
"\000>\000s\000o\000m\000e\000 \000t\000e\000x\000t\000<\000/"
|
||
|
"\000d\000o\000c\000>";
|
||
|
if (XML_Parse(parser, text, sizeof(text)-1, XML_TRUE) == XML_STATUS_ERROR)
|
||
|
xml_failure(parser);
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
START_TEST(test_utf16_le_epilog_newline)
|
||
|
{
|
||
|
unsigned int first_chunk_bytes = 17;
|
||
|
char text[] =
|
||
|
"\xFF\xFE" /* BOM */
|
||
|
"<\000e\000/\000>\000" /* document element */
|
||
|
"\r\000\n\000\r\000\n\000"; /* epilog */
|
||
|
|
||
|
if (first_chunk_bytes >= sizeof(text) - 1)
|
||
|
fail("bad value of first_chunk_bytes");
|
||
|
if ( XML_Parse(parser, text, first_chunk_bytes, XML_FALSE)
|
||
|
== XML_STATUS_ERROR)
|
||
|
xml_failure(parser);
|
||
|
else {
|
||
|
enum XML_Status rc;
|
||
|
rc = XML_Parse(parser, text + first_chunk_bytes,
|
||
|
sizeof(text) - first_chunk_bytes - 1, XML_TRUE);
|
||
|
if (rc == XML_STATUS_ERROR)
|
||
|
xml_failure(parser);
|
||
|
}
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
/* Regression test for SF bug #481609, #774028. */
|
||
|
START_TEST(test_latin1_umlauts)
|
||
|
{
|
||
|
char *text =
|
||
|
"<?xml version='1.0' encoding='iso-8859-1'?>\n"
|
||
|
"<e a='\xE4 \xF6 \xFC ä ö ü ä ö ü >'\n"
|
||
|
" >\xE4 \xF6 \xFC ä ö ü ä ö ü ></e>";
|
||
|
char *utf8 =
|
||
|
"\xC3\xA4 \xC3\xB6 \xC3\xBC "
|
||
|
"\xC3\xA4 \xC3\xB6 \xC3\xBC "
|
||
|
"\xC3\xA4 \xC3\xB6 \xC3\xBC >";
|
||
|
run_character_check(text, utf8);
|
||
|
XML_ParserReset(parser, NULL);
|
||
|
run_attribute_check(text, utf8);
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
/* Regression test #1 for SF bug #653180. */
|
||
|
START_TEST(test_line_number_after_parse)
|
||
|
{
|
||
|
char *text =
|
||
|
"<tag>\n"
|
||
|
"\n"
|
||
|
"\n</tag>";
|
||
|
XML_Size lineno;
|
||
|
|
||
|
if (XML_Parse(parser, text, strlen(text), XML_FALSE) == XML_STATUS_ERROR)
|
||
|
xml_failure(parser);
|
||
|
lineno = XML_GetCurrentLineNumber(parser);
|
||
|
if (lineno != 4) {
|
||
|
char buffer[100];
|
||
|
sprintf(buffer,
|
||
|
"expected 4 lines, saw %" XML_FMT_INT_MOD "u", lineno);
|
||
|
fail(buffer);
|
||
|
}
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
/* Regression test #2 for SF bug #653180. */
|
||
|
START_TEST(test_column_number_after_parse)
|
||
|
{
|
||
|
char *text = "<tag></tag>";
|
||
|
XML_Size colno;
|
||
|
|
||
|
if (XML_Parse(parser, text, strlen(text), XML_FALSE) == XML_STATUS_ERROR)
|
||
|
xml_failure(parser);
|
||
|
colno = XML_GetCurrentColumnNumber(parser);
|
||
|
if (colno != 11) {
|
||
|
char buffer[100];
|
||
|
sprintf(buffer,
|
||
|
"expected 11 columns, saw %" XML_FMT_INT_MOD "u", colno);
|
||
|
fail(buffer);
|
||
|
}
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
static void XMLCALL
|
||
|
start_element_event_handler2(void *userData, const XML_Char *name,
|
||
|
const XML_Char **attr)
|
||
|
{
|
||
|
CharData *storage = (CharData *) userData;
|
||
|
char buffer[100];
|
||
|
|
||
|
sprintf(buffer,
|
||
|
"<%s> at col:%" XML_FMT_INT_MOD "u line:%"\
|
||
|
XML_FMT_INT_MOD "u\n", name,
|
||
|
XML_GetCurrentColumnNumber(parser),
|
||
|
XML_GetCurrentLineNumber(parser));
|
||
|
CharData_AppendString(storage, buffer);
|
||
|
}
|
||
|
|
||
|
static void XMLCALL
|
||
|
end_element_event_handler2(void *userData, const XML_Char *name)
|
||
|
{
|
||
|
CharData *storage = (CharData *) userData;
|
||
|
char buffer[100];
|
||
|
|
||
|
sprintf(buffer,
|
||
|
"</%s> at col:%" XML_FMT_INT_MOD "u line:%"\
|
||
|
XML_FMT_INT_MOD "u\n", name,
|
||
|
XML_GetCurrentColumnNumber(parser),
|
||
|
XML_GetCurrentLineNumber(parser));
|
||
|
CharData_AppendString(storage, buffer);
|
||
|
}
|
||
|
|
||
|
/* Regression test #3 for SF bug #653180. */
|
||
|
START_TEST(test_line_and_column_numbers_inside_handlers)
|
||
|
{
|
||
|
char *text =
|
||
|
"<a>\n" /* Unix end-of-line */
|
||
|
" <b>\r\n" /* Windows end-of-line */
|
||
|
" <c/>\r" /* Mac OS end-of-line */
|
||
|
" </b>\n"
|
||
|
" <d>\n"
|
||
|
" <f/>\n"
|
||
|
" </d>\n"
|
||
|
"</a>";
|
||
|
char *expected =
|
||
|
"<a> at col:0 line:1\n"
|
||
|
"<b> at col:2 line:2\n"
|
||
|
"<c> at col:4 line:3\n"
|
||
|
"</c> at col:8 line:3\n"
|
||
|
"</b> at col:2 line:4\n"
|
||
|
"<d> at col:2 line:5\n"
|
||
|
"<f> at col:4 line:6\n"
|
||
|
"</f> at col:8 line:6\n"
|
||
|
"</d> at col:2 line:7\n"
|
||
|
"</a> at col:0 line:8\n";
|
||
|
CharData storage;
|
||
|
|
||
|
CharData_Init(&storage);
|
||
|
XML_SetUserData(parser, &storage);
|
||
|
XML_SetStartElementHandler(parser, start_element_event_handler2);
|
||
|
XML_SetEndElementHandler(parser, end_element_event_handler2);
|
||
|
if (XML_Parse(parser, text, strlen(text), XML_TRUE) == XML_STATUS_ERROR)
|
||
|
xml_failure(parser);
|
||
|
|
||
|
CharData_CheckString(&storage, expected);
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
/* Regression test #4 for SF bug #653180. */
|
||
|
START_TEST(test_line_number_after_error)
|
||
|
{
|
||
|
char *text =
|
||
|
"<a>\n"
|
||
|
" <b>\n"
|
||
|
" </a>"; /* missing </b> */
|
||
|
XML_Size lineno;
|
||
|
if (XML_Parse(parser, text, strlen(text), XML_FALSE) != XML_STATUS_ERROR)
|
||
|
fail("Expected a parse error");
|
||
|
|
||
|
lineno = XML_GetCurrentLineNumber(parser);
|
||
|
if (lineno != 3) {
|
||
|
char buffer[100];
|
||
|
sprintf(buffer, "expected 3 lines, saw %" XML_FMT_INT_MOD "u", lineno);
|
||
|
fail(buffer);
|
||
|
}
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
/* Regression test #5 for SF bug #653180. */
|
||
|
START_TEST(test_column_number_after_error)
|
||
|
{
|
||
|
char *text =
|
||
|
"<a>\n"
|
||
|
" <b>\n"
|
||
|
" </a>"; /* missing </b> */
|
||
|
XML_Size colno;
|
||
|
if (XML_Parse(parser, text, strlen(text), XML_FALSE) != XML_STATUS_ERROR)
|
||
|
fail("Expected a parse error");
|
||
|
|
||
|
colno = XML_GetCurrentColumnNumber(parser);
|
||
|
if (colno != 4) {
|
||
|
char buffer[100];
|
||
|
sprintf(buffer,
|
||
|
"expected 4 columns, saw %" XML_FMT_INT_MOD "u", colno);
|
||
|
fail(buffer);
|
||
|
}
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
/* Regression test for SF bug #478332. */
|
||
|
START_TEST(test_really_long_lines)
|
||
|
{
|
||
|
/* This parses an input line longer than INIT_DATA_BUF_SIZE
|
||
|
characters long (defined to be 1024 in xmlparse.c). We take a
|
||
|
really cheesy approach to building the input buffer, because
|
||
|
this avoids writing bugs in buffer-filling code.
|
||
|
*/
|
||
|
char *text =
|
||
|
"<e>"
|
||
|
/* 64 chars */
|
||
|
"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
|
||
|
/* until we have at least 1024 characters on the line: */
|
||
|
"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
|
||
|
"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
|
||
|
"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
|
||
|
"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
|
||
|
"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
|
||
|
"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
|
||
|
"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
|
||
|
"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
|
||
|
"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
|
||
|
"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
|
||
|
"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
|
||
|
"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
|
||
|
"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
|
||
|
"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
|
||
|
"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
|
||
|
"ABCDEFGHIJKLMNOPQRSTUVWXYZabcdefghijklmnopqrstuvwxyz0123456789-+"
|
||
|
"</e>";
|
||
|
if (XML_Parse(parser, text, strlen(text), XML_TRUE) == XML_STATUS_ERROR)
|
||
|
xml_failure(parser);
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
|
||
|
/*
|
||
|
* Element event tests.
|
||
|
*/
|
||
|
|
||
|
static void XMLCALL
|
||
|
end_element_event_handler(void *userData, const XML_Char *name)
|
||
|
{
|
||
|
CharData *storage = (CharData *) userData;
|
||
|
CharData_AppendString(storage, "/");
|
||
|
CharData_AppendXMLChars(storage, name, -1);
|
||
|
}
|
||
|
|
||
|
START_TEST(test_end_element_events)
|
||
|
{
|
||
|
char *text = "<a><b><c/></b><d><f/></d></a>";
|
||
|
char *expected = "/c/b/f/d/a";
|
||
|
CharData storage;
|
||
|
|
||
|
CharData_Init(&storage);
|
||
|
XML_SetUserData(parser, &storage);
|
||
|
XML_SetEndElementHandler(parser, end_element_event_handler);
|
||
|
if (XML_Parse(parser, text, strlen(text), XML_TRUE) == XML_STATUS_ERROR)
|
||
|
xml_failure(parser);
|
||
|
CharData_CheckString(&storage, expected);
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
|
||
|
/*
|
||
|
* Attribute tests.
|
||
|
*/
|
||
|
|
||
|
/* Helpers used by the following test; this checks any "attr" and "refs"
|
||
|
attributes to make sure whitespace has been normalized.
|
||
|
|
||
|
Return true if whitespace has been normalized in a string, using
|
||
|
the rules for attribute value normalization. The 'is_cdata' flag
|
||
|
is needed since CDATA attributes don't need to have multiple
|
||
|
whitespace characters collapsed to a single space, while other
|
||
|
attribute data types do. (Section 3.3.3 of the recommendation.)
|
||
|
*/
|
||
|
static int
|
||
|
is_whitespace_normalized(const XML_Char *s, int is_cdata)
|
||
|
{
|
||
|
int blanks = 0;
|
||
|
int at_start = 1;
|
||
|
while (*s) {
|
||
|
if (*s == ' ')
|
||
|
++blanks;
|
||
|
else if (*s == '\t' || *s == '\n' || *s == '\r')
|
||
|
return 0;
|
||
|
else {
|
||
|
if (at_start) {
|
||
|
at_start = 0;
|
||
|
if (blanks && !is_cdata)
|
||
|
/* illegal leading blanks */
|
||
|
return 0;
|
||
|
}
|
||
|
else if (blanks > 1 && !is_cdata)
|
||
|
return 0;
|
||
|
blanks = 0;
|
||
|
}
|
||
|
++s;
|
||
|
}
|
||
|
if (blanks && !is_cdata)
|
||
|
return 0;
|
||
|
return 1;
|
||
|
}
|
||
|
|
||
|
/* Check the attribute whitespace checker itself.  Each string is
   tested twice: as a non-CDATA value (second argument 0) and as a
   CDATA value (second argument 1). */
static void
testhelper_is_whitespace_normalized(void)
{
    /* No blanks, and single interior blanks, are always normalized. */
    assert(is_whitespace_normalized("abc", 0));
    assert(is_whitespace_normalized("abc", 1));
    assert(is_whitespace_normalized("abc def ghi", 0));
    assert(is_whitespace_normalized("abc def ghi", 1));
    /* Leading blank: only acceptable for CDATA. */
    assert(!is_whitespace_normalized(" abc def ghi", 0));
    assert(is_whitespace_normalized(" abc def ghi", 1));
    /* Doubled interior blanks: only acceptable for CDATA.  The two
       spaces between the words are what is being tested. */
    assert(!is_whitespace_normalized("abc  def  ghi", 0));
    assert(is_whitespace_normalized("abc  def  ghi", 1));
    /* Trailing blank: only acceptable for CDATA. */
    assert(!is_whitespace_normalized("abc def ghi ", 0));
    assert(is_whitespace_normalized("abc def ghi ", 1));
    /* A lone blank: only acceptable for CDATA. */
    assert(!is_whitespace_normalized(" ", 0));
    assert(is_whitespace_normalized(" ", 1));
    /* Tab, newline and carriage return are never acceptable. */
    assert(!is_whitespace_normalized("\t", 0));
    assert(!is_whitespace_normalized("\t", 1));
    assert(!is_whitespace_normalized("\n", 0));
    assert(!is_whitespace_normalized("\n", 1));
    assert(!is_whitespace_normalized("\r", 0));
    assert(!is_whitespace_normalized("\r", 1));
    assert(!is_whitespace_normalized("abc\t def", 1));
}
|
||
|
|
||
|
static void XMLCALL
|
||
|
check_attr_contains_normalized_whitespace(void *userData,
|
||
|
const XML_Char *name,
|
||
|
const XML_Char **atts)
|
||
|
{
|
||
|
int i;
|
||
|
for (i = 0; atts[i] != NULL; i += 2) {
|
||
|
const XML_Char *attrname = atts[i];
|
||
|
const XML_Char *value = atts[i + 1];
|
||
|
if (strcmp("attr", attrname) == 0
|
||
|
|| strcmp("ents", attrname) == 0
|
||
|
|| strcmp("refs", attrname) == 0) {
|
||
|
if (!is_whitespace_normalized(value, 0)) {
|
||
|
char buffer[256];
|
||
|
sprintf(buffer, "attribute value not normalized: %s='%s'",
|
||
|
attrname, value);
|
||
|
fail(buffer);
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
}
|
||
|
|
||
|
START_TEST(test_attr_whitespace_normalization)
|
||
|
{
|
||
|
char *text =
|
||
|
"<!DOCTYPE doc [\n"
|
||
|
" <!ATTLIST doc\n"
|
||
|
" attr NMTOKENS #REQUIRED\n"
|
||
|
" ents ENTITIES #REQUIRED\n"
|
||
|
" refs IDREFS #REQUIRED>\n"
|
||
|
"]>\n"
|
||
|
"<doc attr=' a b c\t\td\te\t' refs=' id-1 \t id-2\t\t' \n"
|
||
|
" ents=' ent-1 \t\r\n"
|
||
|
" ent-2 ' >\n"
|
||
|
" <e id='id-1'/>\n"
|
||
|
" <e id='id-2'/>\n"
|
||
|
"</doc>";
|
||
|
|
||
|
XML_SetStartElementHandler(parser,
|
||
|
check_attr_contains_normalized_whitespace);
|
||
|
if (XML_Parse(parser, text, strlen(text), XML_TRUE) == XML_STATUS_ERROR)
|
||
|
xml_failure(parser);
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
|
||
|
/*
|
||
|
* XML declaration tests.
|
||
|
*/
|
||
|
|
||
|
START_TEST(test_xmldecl_misplaced)
|
||
|
{
|
||
|
expect_failure("\n"
|
||
|
"<?xml version='1.0'?>\n"
|
||
|
"<a/>",
|
||
|
XML_ERROR_MISPLACED_XML_PI,
|
||
|
"failed to report misplaced XML declaration");
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
/* Regression test for SF bug #584832. */
|
||
|
static int XMLCALL
|
||
|
UnknownEncodingHandler(void *data,const XML_Char *encoding,XML_Encoding *info)
|
||
|
{
|
||
|
if (strcmp(encoding,"unsupported-encoding") == 0) {
|
||
|
int i;
|
||
|
for (i = 0; i < 256; ++i)
|
||
|
info->map[i] = i;
|
||
|
info->data = NULL;
|
||
|
info->convert = NULL;
|
||
|
info->release = NULL;
|
||
|
return XML_STATUS_OK;
|
||
|
}
|
||
|
return XML_STATUS_ERROR;
|
||
|
}
|
||
|
|
||
|
START_TEST(test_unknown_encoding_internal_entity)
|
||
|
{
|
||
|
char *text =
|
||
|
"<?xml version='1.0' encoding='unsupported-encoding'?>\n"
|
||
|
"<!DOCTYPE test [<!ENTITY foo 'bar'>]>\n"
|
||
|
"<test a='&foo;'/>";
|
||
|
|
||
|
XML_SetUnknownEncodingHandler(parser, UnknownEncodingHandler, NULL);
|
||
|
if (XML_Parse(parser, text, strlen(text), XML_TRUE) == XML_STATUS_ERROR)
|
||
|
xml_failure(parser);
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
/* Regression test for SF bug #620106. */
|
||
|
static int XMLCALL
|
||
|
external_entity_loader_set_encoding(XML_Parser parser,
|
||
|
const XML_Char *context,
|
||
|
const XML_Char *base,
|
||
|
const XML_Char *systemId,
|
||
|
const XML_Char *publicId)
|
||
|
{
|
||
|
/* This text says it's an unsupported encoding, but it's really
|
||
|
UTF-8, which we tell Expat using XML_SetEncoding().
|
||
|
*/
|
||
|
char *text =
|
||
|
"<?xml encoding='iso-8859-3'?>"
|
||
|
"\xC3\xA9";
|
||
|
XML_Parser extparser;
|
||
|
|
||
|
extparser = XML_ExternalEntityParserCreate(parser, context, NULL);
|
||
|
if (extparser == NULL)
|
||
|
fail("Could not create external entity parser.");
|
||
|
if (!XML_SetEncoding(extparser, "utf-8"))
|
||
|
fail("XML_SetEncoding() ignored for external entity");
|
||
|
if ( XML_Parse(extparser, text, strlen(text), XML_TRUE)
|
||
|
== XML_STATUS_ERROR) {
|
||
|
xml_failure(parser);
|
||
|
return 0;
|
||
|
}
|
||
|
return 1;
|
||
|
}
|
||
|
|
||
|
START_TEST(test_ext_entity_set_encoding)
|
||
|
{
|
||
|
char *text =
|
||
|
"<!DOCTYPE doc [\n"
|
||
|
" <!ENTITY en SYSTEM 'http://xml.libexpat.org/dummy.ent'>\n"
|
||
|
"]>\n"
|
||
|
"<doc>&en;</doc>";
|
||
|
|
||
|
XML_SetExternalEntityRefHandler(parser,
|
||
|
external_entity_loader_set_encoding);
|
||
|
run_character_check(text, "\xC3\xA9");
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
/* Test that no error is reported for unknown entities if we don't
|
||
|
read an external subset. This was fixed in Expat 1.95.5.
|
||
|
*/
|
||
|
START_TEST(test_wfc_undeclared_entity_unread_external_subset) {
|
||
|
char *text =
|
||
|
"<!DOCTYPE doc SYSTEM 'foo'>\n"
|
||
|
"<doc>&entity;</doc>";
|
||
|
|
||
|
if (XML_Parse(parser, text, strlen(text), XML_TRUE) == XML_STATUS_ERROR)
|
||
|
xml_failure(parser);
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
/* Test that an error is reported for unknown entities if we don't
|
||
|
have an external subset.
|
||
|
*/
|
||
|
START_TEST(test_wfc_undeclared_entity_no_external_subset) {
|
||
|
expect_failure("<doc>&entity;</doc>",
|
||
|
XML_ERROR_UNDEFINED_ENTITY,
|
||
|
"Parser did not report undefined entity w/out a DTD.");
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
/* Test that an error is reported for unknown entities if we don't
|
||
|
read an external subset, but have been declared standalone.
|
||
|
*/
|
||
|
START_TEST(test_wfc_undeclared_entity_standalone) {
|
||
|
char *text =
|
||
|
"<?xml version='1.0' encoding='us-ascii' standalone='yes'?>\n"
|
||
|
"<!DOCTYPE doc SYSTEM 'foo'>\n"
|
||
|
"<doc>&entity;</doc>";
|
||
|
|
||
|
expect_failure(text,
|
||
|
XML_ERROR_UNDEFINED_ENTITY,
|
||
|
"Parser did not report undefined entity (standalone).");
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
static int XMLCALL
|
||
|
external_entity_loader(XML_Parser parser,
|
||
|
const XML_Char *context,
|
||
|
const XML_Char *base,
|
||
|
const XML_Char *systemId,
|
||
|
const XML_Char *publicId)
|
||
|
{
|
||
|
char *text = (char *)XML_GetUserData(parser);
|
||
|
XML_Parser extparser;
|
||
|
|
||
|
extparser = XML_ExternalEntityParserCreate(parser, context, NULL);
|
||
|
if (extparser == NULL)
|
||
|
fail("Could not create external entity parser.");
|
||
|
if ( XML_Parse(extparser, text, strlen(text), XML_TRUE)
|
||
|
== XML_STATUS_ERROR) {
|
||
|
xml_failure(parser);
|
||
|
return XML_STATUS_ERROR;
|
||
|
}
|
||
|
return XML_STATUS_OK;
|
||
|
}
|
||
|
|
||
|
/* Test that an error is reported for unknown entities if we have read
|
||
|
an external subset, and standalone is true.
|
||
|
*/
|
||
|
START_TEST(test_wfc_undeclared_entity_with_external_subset_standalone) {
|
||
|
char *text =
|
||
|
"<?xml version='1.0' encoding='us-ascii' standalone='yes'?>\n"
|
||
|
"<!DOCTYPE doc SYSTEM 'foo'>\n"
|
||
|
"<doc>&entity;</doc>";
|
||
|
char *foo_text =
|
||
|
"<!ELEMENT doc (#PCDATA)*>";
|
||
|
|
||
|
XML_SetParamEntityParsing(parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
|
||
|
XML_SetUserData(parser, foo_text);
|
||
|
XML_SetExternalEntityRefHandler(parser, external_entity_loader);
|
||
|
expect_failure(text,
|
||
|
XML_ERROR_UNDEFINED_ENTITY,
|
||
|
"Parser did not report undefined entity (external DTD).");
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
/* Test that no error is reported for unknown entities if we have read
|
||
|
an external subset, and standalone is false.
|
||
|
*/
|
||
|
START_TEST(test_wfc_undeclared_entity_with_external_subset) {
|
||
|
char *text =
|
||
|
"<?xml version='1.0' encoding='us-ascii'?>\n"
|
||
|
"<!DOCTYPE doc SYSTEM 'foo'>\n"
|
||
|
"<doc>&entity;</doc>";
|
||
|
char *foo_text =
|
||
|
"<!ELEMENT doc (#PCDATA)*>";
|
||
|
|
||
|
XML_SetParamEntityParsing(parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
|
||
|
XML_SetUserData(parser, foo_text);
|
||
|
XML_SetExternalEntityRefHandler(parser, external_entity_loader);
|
||
|
if (XML_Parse(parser, text, strlen(text), XML_TRUE) == XML_STATUS_ERROR)
|
||
|
xml_failure(parser);
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
START_TEST(test_wfc_no_recursive_entity_refs)
|
||
|
{
|
||
|
char *text =
|
||
|
"<!DOCTYPE doc [\n"
|
||
|
" <!ENTITY entity '&entity;'>\n"
|
||
|
"]>\n"
|
||
|
"<doc>&entity;</doc>";
|
||
|
|
||
|
expect_failure(text,
|
||
|
XML_ERROR_RECURSIVE_ENTITY_REF,
|
||
|
"Parser did not report recursive entity reference.");
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
/* Regression test for SF bug #483514. */
|
||
|
START_TEST(test_dtd_default_handling)
|
||
|
{
|
||
|
char *text =
|
||
|
"<!DOCTYPE doc [\n"
|
||
|
"<!ENTITY e SYSTEM 'http://xml.libexpat.org/e'>\n"
|
||
|
"<!NOTATION n SYSTEM 'http://xml.libexpat.org/n'>\n"
|
||
|
"<!ELEMENT doc EMPTY>\n"
|
||
|
"<!ATTLIST doc a CDATA #IMPLIED>\n"
|
||
|
"<?pi in dtd?>\n"
|
||
|
"<!--comment in dtd-->\n"
|
||
|
"]><doc/>";
|
||
|
|
||
|
XML_SetDefaultHandler(parser, accumulate_characters);
|
||
|
XML_SetDoctypeDeclHandler(parser,
|
||
|
dummy_start_doctype_handler,
|
||
|
dummy_end_doctype_handler);
|
||
|
XML_SetEntityDeclHandler(parser, dummy_entity_decl_handler);
|
||
|
XML_SetNotationDeclHandler(parser, dummy_notation_decl_handler);
|
||
|
XML_SetElementDeclHandler(parser, dummy_element_decl_handler);
|
||
|
XML_SetAttlistDeclHandler(parser, dummy_attlist_decl_handler);
|
||
|
XML_SetProcessingInstructionHandler(parser, dummy_pi_handler);
|
||
|
XML_SetCommentHandler(parser, dummy_comment_handler);
|
||
|
run_character_check(text, "\n\n\n\n\n\n\n<doc/>");
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
/* See related SF bug #673791.
|
||
|
When namespace processing is enabled, setting the namespace URI for
|
||
|
a prefix is not allowed; this test ensures that it *is* allowed
|
||
|
when namespace processing is not enabled.
|
||
|
(See Namespaces in XML, section 2.)
|
||
|
*/
|
||
|
START_TEST(test_empty_ns_without_namespaces)
|
||
|
{
|
||
|
char *text =
|
||
|
"<doc xmlns:prefix='http://www.example.com/'>\n"
|
||
|
" <e xmlns:prefix=''/>\n"
|
||
|
"</doc>";
|
||
|
|
||
|
if (XML_Parse(parser, text, strlen(text), XML_TRUE) == XML_STATUS_ERROR)
|
||
|
xml_failure(parser);
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
/* Regression test for SF bug #824420.
|
||
|
Checks that an xmlns:prefix attribute set in an attribute's default
|
||
|
value isn't misinterpreted.
|
||
|
*/
|
||
|
START_TEST(test_ns_in_attribute_default_without_namespaces)
|
||
|
{
|
||
|
char *text =
|
||
|
"<!DOCTYPE e:element [\n"
|
||
|
" <!ATTLIST e:element\n"
|
||
|
" xmlns:e CDATA 'http://example.com/'>\n"
|
||
|
" ]>\n"
|
||
|
"<e:element/>";
|
||
|
|
||
|
if (XML_Parse(parser, text, strlen(text), XML_TRUE) == XML_STATUS_ERROR)
|
||
|
xml_failure(parser);
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
/* Sample document used by the stop/suspend character-data tests: one
   <s> element whose content is 1200 digit characters, i.e. the same
   60-character run repeated 20 times.  The helper macros exist only
   to build the literal and are removed again right after it. */
#define LONG_TEXT_CHUNK_60 \
    "012345678901234567890123456789012345678901234567890123456789"
#define LONG_TEXT_CHUNK_300 \
    LONG_TEXT_CHUNK_60 LONG_TEXT_CHUNK_60 LONG_TEXT_CHUNK_60 \
    LONG_TEXT_CHUNK_60 LONG_TEXT_CHUNK_60
static char *long_character_data_text =
    "<?xml version='1.0' encoding='iso-8859-1'?><s>"
    LONG_TEXT_CHUNK_300 LONG_TEXT_CHUNK_300
    LONG_TEXT_CHUNK_300 LONG_TEXT_CHUNK_300
    "</s>";
#undef LONG_TEXT_CHUNK_300
#undef LONG_TEXT_CHUNK_60
|
||
|
|
||
|
static XML_Bool resumable = XML_FALSE;
|
||
|
|
||
|
static void
|
||
|
clearing_aborting_character_handler(void *userData,
|
||
|
const XML_Char *s, int len)
|
||
|
{
|
||
|
XML_StopParser(parser, resumable);
|
||
|
XML_SetCharacterDataHandler(parser, NULL);
|
||
|
}
|
||
|
|
||
|
/* Regression test for SF bug #1515266: missing check of stopped
|
||
|
parser in doContext() 'for' loop. */
|
||
|
START_TEST(test_stop_parser_between_char_data_calls)
|
||
|
{
|
||
|
/* The sample data must be big enough that there are two calls to
|
||
|
the character data handler from within the inner "for" loop of
|
||
|
the XML_TOK_DATA_CHARS case in doContent(), and the character
|
||
|
handler must stop the parser and clear the character data
|
||
|
handler.
|
||
|
*/
|
||
|
char *text = long_character_data_text;
|
||
|
|
||
|
XML_SetCharacterDataHandler(parser, clearing_aborting_character_handler);
|
||
|
resumable = XML_FALSE;
|
||
|
if (XML_Parse(parser, text, strlen(text), XML_TRUE) != XML_STATUS_ERROR)
|
||
|
xml_failure(parser);
|
||
|
if (XML_GetErrorCode(parser) != XML_ERROR_ABORTED)
|
||
|
xml_failure(parser);
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
/* Regression test for SF bug #1515266: missing check of stopped
|
||
|
parser in doContext() 'for' loop. */
|
||
|
START_TEST(test_suspend_parser_between_char_data_calls)
|
||
|
{
|
||
|
/* The sample data must be big enough that there are two calls to
|
||
|
the character data handler from within the inner "for" loop of
|
||
|
the XML_TOK_DATA_CHARS case in doContent(), and the character
|
||
|
handler must stop the parser and clear the character data
|
||
|
handler.
|
||
|
*/
|
||
|
char *text = long_character_data_text;
|
||
|
|
||
|
XML_SetCharacterDataHandler(parser, clearing_aborting_character_handler);
|
||
|
resumable = XML_TRUE;
|
||
|
if (XML_Parse(parser, text, strlen(text), XML_TRUE) != XML_STATUS_SUSPENDED)
|
||
|
xml_failure(parser);
|
||
|
if (XML_GetErrorCode(parser) != XML_ERROR_NONE)
|
||
|
xml_failure(parser);
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
|
||
|
/*
|
||
|
* Namespaces tests.
|
||
|
*/
|
||
|
|
||
|
static void
|
||
|
namespace_setup(void)
|
||
|
{
|
||
|
parser = XML_ParserCreateNS(NULL, ' ');
|
||
|
if (parser == NULL)
|
||
|
fail("Parser not created.");
|
||
|
}
|
||
|
|
||
|
/* Fixture teardown for the namespace test case.  Nothing here is
   namespace-specific, so the work is delegated to the basic teardown,
   which frees the global parser if one exists. */
static void
namespace_teardown(void)
{
    basic_teardown();
}
|
||
|
|
||
|
/* Check that an element name and attribute name match the expected values.
|
||
|
The expected values are passed as an array reference of string pointers
|
||
|
provided as the userData argument; the first is the expected
|
||
|
element name, and the second is the expected attribute name.
|
||
|
*/
|
||
|
static void XMLCALL
|
||
|
triplet_start_checker(void *userData, const XML_Char *name,
|
||
|
const XML_Char **atts)
|
||
|
{
|
||
|
char **elemstr = (char **)userData;
|
||
|
char buffer[1024];
|
||
|
if (strcmp(elemstr[0], name) != 0) {
|
||
|
sprintf(buffer, "unexpected start string: '%s'", name);
|
||
|
fail(buffer);
|
||
|
}
|
||
|
if (strcmp(elemstr[1], atts[0]) != 0) {
|
||
|
sprintf(buffer, "unexpected attribute string: '%s'", atts[0]);
|
||
|
fail(buffer);
|
||
|
}
|
||
|
}
|
||
|
|
||
|
/* Check that the element name passed to the end-element handler matches
|
||
|
the expected value. The expected value is passed as the first element
|
||
|
in an array of strings passed as the userData argument.
|
||
|
*/
|
||
|
static void XMLCALL
|
||
|
triplet_end_checker(void *userData, const XML_Char *name)
|
||
|
{
|
||
|
char **elemstr = (char **)userData;
|
||
|
if (strcmp(elemstr[0], name) != 0) {
|
||
|
char buffer[1024];
|
||
|
sprintf(buffer, "unexpected end string: '%s'", name);
|
||
|
fail(buffer);
|
||
|
}
|
||
|
}
|
||
|
|
||
|
START_TEST(test_return_ns_triplet)
|
||
|
{
|
||
|
char *text =
|
||
|
"<foo:e xmlns:foo='http://expat.sf.net/' bar:a='12'\n"
|
||
|
" xmlns:bar='http://expat.sf.net/'></foo:e>";
|
||
|
char *elemstr[] = {
|
||
|
"http://expat.sf.net/ e foo",
|
||
|
"http://expat.sf.net/ a bar"
|
||
|
};
|
||
|
XML_SetReturnNSTriplet(parser, XML_TRUE);
|
||
|
XML_SetUserData(parser, elemstr);
|
||
|
XML_SetElementHandler(parser, triplet_start_checker, triplet_end_checker);
|
||
|
if (XML_Parse(parser, text, strlen(text), XML_TRUE) == XML_STATUS_ERROR)
|
||
|
xml_failure(parser);
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
static void XMLCALL
|
||
|
overwrite_start_checker(void *userData, const XML_Char *name,
|
||
|
const XML_Char **atts)
|
||
|
{
|
||
|
CharData *storage = (CharData *) userData;
|
||
|
CharData_AppendString(storage, "start ");
|
||
|
CharData_AppendXMLChars(storage, name, -1);
|
||
|
while (*atts != NULL) {
|
||
|
CharData_AppendString(storage, "\nattribute ");
|
||
|
CharData_AppendXMLChars(storage, *atts, -1);
|
||
|
atts += 2;
|
||
|
}
|
||
|
CharData_AppendString(storage, "\n");
|
||
|
}
|
||
|
|
||
|
static void XMLCALL
|
||
|
overwrite_end_checker(void *userData, const XML_Char *name)
|
||
|
{
|
||
|
CharData *storage = (CharData *) userData;
|
||
|
CharData_AppendString(storage, "end ");
|
||
|
CharData_AppendXMLChars(storage, name, -1);
|
||
|
CharData_AppendString(storage, "\n");
|
||
|
}
|
||
|
|
||
|
static void
|
||
|
run_ns_tagname_overwrite_test(char *text, char *result)
|
||
|
{
|
||
|
CharData storage;
|
||
|
CharData_Init(&storage);
|
||
|
XML_SetUserData(parser, &storage);
|
||
|
XML_SetElementHandler(parser,
|
||
|
overwrite_start_checker, overwrite_end_checker);
|
||
|
if (XML_Parse(parser, text, strlen(text), XML_TRUE) == XML_STATUS_ERROR)
|
||
|
xml_failure(parser);
|
||
|
CharData_CheckString(&storage, result);
|
||
|
}
|
||
|
|
||
|
/* Regression test for SF bug #566334. */
|
||
|
START_TEST(test_ns_tagname_overwrite)
|
||
|
{
|
||
|
char *text =
|
||
|
"<n:e xmlns:n='http://xml.libexpat.org/'>\n"
|
||
|
" <n:f n:attr='foo'/>\n"
|
||
|
" <n:g n:attr2='bar'/>\n"
|
||
|
"</n:e>";
|
||
|
char *result =
|
||
|
"start http://xml.libexpat.org/ e\n"
|
||
|
"start http://xml.libexpat.org/ f\n"
|
||
|
"attribute http://xml.libexpat.org/ attr\n"
|
||
|
"end http://xml.libexpat.org/ f\n"
|
||
|
"start http://xml.libexpat.org/ g\n"
|
||
|
"attribute http://xml.libexpat.org/ attr2\n"
|
||
|
"end http://xml.libexpat.org/ g\n"
|
||
|
"end http://xml.libexpat.org/ e\n";
|
||
|
run_ns_tagname_overwrite_test(text, result);
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
/* Regression test for SF bug #566334. */
|
||
|
START_TEST(test_ns_tagname_overwrite_triplet)
|
||
|
{
|
||
|
char *text =
|
||
|
"<n:e xmlns:n='http://xml.libexpat.org/'>\n"
|
||
|
" <n:f n:attr='foo'/>\n"
|
||
|
" <n:g n:attr2='bar'/>\n"
|
||
|
"</n:e>";
|
||
|
char *result =
|
||
|
"start http://xml.libexpat.org/ e n\n"
|
||
|
"start http://xml.libexpat.org/ f n\n"
|
||
|
"attribute http://xml.libexpat.org/ attr n\n"
|
||
|
"end http://xml.libexpat.org/ f n\n"
|
||
|
"start http://xml.libexpat.org/ g n\n"
|
||
|
"attribute http://xml.libexpat.org/ attr2 n\n"
|
||
|
"end http://xml.libexpat.org/ g n\n"
|
||
|
"end http://xml.libexpat.org/ e n\n";
|
||
|
XML_SetReturnNSTriplet(parser, XML_TRUE);
|
||
|
run_ns_tagname_overwrite_test(text, result);
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
|
||
|
/* Regression test for SF bug #620343. */
|
||
|
static void XMLCALL
|
||
|
start_element_fail(void *userData,
|
||
|
const XML_Char *name, const XML_Char **atts)
|
||
|
{
|
||
|
/* We should never get here. */
|
||
|
fail("should never reach start_element_fail()");
|
||
|
}
|
||
|
|
||
|
static void XMLCALL
|
||
|
start_ns_clearing_start_element(void *userData,
|
||
|
const XML_Char *prefix,
|
||
|
const XML_Char *uri)
|
||
|
{
|
||
|
XML_SetStartElementHandler((XML_Parser) userData, NULL);
|
||
|
}
|
||
|
|
||
|
START_TEST(test_start_ns_clears_start_element)
|
||
|
{
|
||
|
/* This needs to use separate start/end tags; using the empty tag
|
||
|
syntax doesn't cause the problematic path through Expat to be
|
||
|
taken.
|
||
|
*/
|
||
|
char *text = "<e xmlns='http://xml.libexpat.org/'></e>";
|
||
|
|
||
|
XML_SetStartElementHandler(parser, start_element_fail);
|
||
|
XML_SetStartNamespaceDeclHandler(parser, start_ns_clearing_start_element);
|
||
|
XML_UseParserAsHandlerArg(parser);
|
||
|
if (XML_Parse(parser, text, strlen(text), XML_TRUE) == XML_STATUS_ERROR)
|
||
|
xml_failure(parser);
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
/* Regression test for SF bug #616863. */
|
||
|
static int XMLCALL
|
||
|
external_entity_handler(XML_Parser parser,
|
||
|
const XML_Char *context,
|
||
|
const XML_Char *base,
|
||
|
const XML_Char *systemId,
|
||
|
const XML_Char *publicId)
|
||
|
{
|
||
|
intptr_t callno = 1 + (intptr_t)XML_GetUserData(parser);
|
||
|
char *text;
|
||
|
XML_Parser p2;
|
||
|
|
||
|
if (callno == 1)
|
||
|
text = ("<!ELEMENT doc (e+)>\n"
|
||
|
"<!ATTLIST doc xmlns CDATA #IMPLIED>\n"
|
||
|
"<!ELEMENT e EMPTY>\n");
|
||
|
else
|
||
|
text = ("<?xml version='1.0' encoding='us-ascii'?>"
|
||
|
"<e/>");
|
||
|
|
||
|
XML_SetUserData(parser, (void *) callno);
|
||
|
p2 = XML_ExternalEntityParserCreate(parser, context, NULL);
|
||
|
if (XML_Parse(p2, text, strlen(text), XML_TRUE) == XML_STATUS_ERROR) {
|
||
|
xml_failure(p2);
|
||
|
return 0;
|
||
|
}
|
||
|
XML_ParserFree(p2);
|
||
|
return 1;
|
||
|
}
|
||
|
|
||
|
START_TEST(test_default_ns_from_ext_subset_and_ext_ge)
|
||
|
{
|
||
|
char *text =
|
||
|
"<?xml version='1.0'?>\n"
|
||
|
"<!DOCTYPE doc SYSTEM 'http://xml.libexpat.org/doc.dtd' [\n"
|
||
|
" <!ENTITY en SYSTEM 'http://xml.libexpat.org/entity.ent'>\n"
|
||
|
"]>\n"
|
||
|
"<doc xmlns='http://xml.libexpat.org/ns1'>\n"
|
||
|
"&en;\n"
|
||
|
"</doc>";
|
||
|
|
||
|
XML_SetParamEntityParsing(parser, XML_PARAM_ENTITY_PARSING_ALWAYS);
|
||
|
XML_SetExternalEntityRefHandler(parser, external_entity_handler);
|
||
|
/* We actually need to set this handler to tickle this bug. */
|
||
|
XML_SetStartElementHandler(parser, dummy_start_element);
|
||
|
XML_SetUserData(parser, NULL);
|
||
|
if (XML_Parse(parser, text, strlen(text), XML_TRUE) == XML_STATUS_ERROR)
|
||
|
xml_failure(parser);
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
/* Regression test #1 for SF bug #673791. */
|
||
|
START_TEST(test_ns_prefix_with_empty_uri_1)
|
||
|
{
|
||
|
char *text =
|
||
|
"<doc xmlns:prefix='http://xml.libexpat.org/'>\n"
|
||
|
" <e xmlns:prefix=''/>\n"
|
||
|
"</doc>";
|
||
|
|
||
|
expect_failure(text,
|
||
|
XML_ERROR_UNDECLARING_PREFIX,
|
||
|
"Did not report re-setting namespace"
|
||
|
" URI with prefix to ''.");
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
/* Regression test #2 for SF bug #673791. */
|
||
|
START_TEST(test_ns_prefix_with_empty_uri_2)
|
||
|
{
|
||
|
char *text =
|
||
|
"<?xml version='1.0'?>\n"
|
||
|
"<docelem xmlns:pre=''/>";
|
||
|
|
||
|
expect_failure(text,
|
||
|
XML_ERROR_UNDECLARING_PREFIX,
|
||
|
"Did not report setting namespace URI with prefix to ''.");
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
/* Regression test #3 for SF bug #673791. */
|
||
|
START_TEST(test_ns_prefix_with_empty_uri_3)
|
||
|
{
|
||
|
char *text =
|
||
|
"<!DOCTYPE doc [\n"
|
||
|
" <!ELEMENT doc EMPTY>\n"
|
||
|
" <!ATTLIST doc\n"
|
||
|
" xmlns:prefix CDATA ''>\n"
|
||
|
"]>\n"
|
||
|
"<doc/>";
|
||
|
|
||
|
expect_failure(text,
|
||
|
XML_ERROR_UNDECLARING_PREFIX,
|
||
|
"Didn't report attr default setting NS w/ prefix to ''.");
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
/* Regression test #4 for SF bug #673791. */
|
||
|
START_TEST(test_ns_prefix_with_empty_uri_4)
|
||
|
{
|
||
|
char *text =
|
||
|
"<!DOCTYPE doc [\n"
|
||
|
" <!ELEMENT prefix:doc EMPTY>\n"
|
||
|
" <!ATTLIST prefix:doc\n"
|
||
|
" xmlns:prefix CDATA 'http://xml.libexpat.org/'>\n"
|
||
|
"]>\n"
|
||
|
"<prefix:doc/>";
|
||
|
/* Packaged info expected by the end element handler;
|
||
|
the weird structuring lets us re-use the triplet_end_checker()
|
||
|
function also used for another test. */
|
||
|
char *elemstr[] = {
|
||
|
"http://xml.libexpat.org/ doc prefix"
|
||
|
};
|
||
|
XML_SetReturnNSTriplet(parser, XML_TRUE);
|
||
|
XML_SetUserData(parser, elemstr);
|
||
|
XML_SetEndElementHandler(parser, triplet_end_checker);
|
||
|
if (XML_Parse(parser, text, strlen(text), XML_TRUE) == XML_STATUS_ERROR)
|
||
|
xml_failure(parser);
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
START_TEST(test_ns_default_with_empty_uri)
|
||
|
{
|
||
|
char *text =
|
||
|
"<doc xmlns='http://xml.libexpat.org/'>\n"
|
||
|
" <e xmlns=''/>\n"
|
||
|
"</doc>";
|
||
|
if (XML_Parse(parser, text, strlen(text), XML_TRUE) == XML_STATUS_ERROR)
|
||
|
xml_failure(parser);
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
/* Regression test for SF bug #692964: two prefixes for one namespace. */
|
||
|
START_TEST(test_ns_duplicate_attrs_diff_prefixes)
|
||
|
{
|
||
|
char *text =
|
||
|
"<doc xmlns:a='http://xml.libexpat.org/a'\n"
|
||
|
" xmlns:b='http://xml.libexpat.org/a'\n"
|
||
|
" a:a='v' b:a='v' />";
|
||
|
expect_failure(text,
|
||
|
XML_ERROR_DUPLICATE_ATTRIBUTE,
|
||
|
"did not report multiple attributes with same URI+name");
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
/* Regression test for SF bug #695401: unbound prefix. */
|
||
|
START_TEST(test_ns_unbound_prefix_on_attribute)
|
||
|
{
|
||
|
char *text = "<doc a:attr=''/>";
|
||
|
expect_failure(text,
|
||
|
XML_ERROR_UNBOUND_PREFIX,
|
||
|
"did not report unbound prefix on attribute");
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
/* Regression test for SF bug #695401: unbound prefix. */
|
||
|
START_TEST(test_ns_unbound_prefix_on_element)
|
||
|
{
|
||
|
char *text = "<a:doc/>";
|
||
|
expect_failure(text,
|
||
|
XML_ERROR_UNBOUND_PREFIX,
|
||
|
"did not report unbound prefix on element");
|
||
|
}
|
||
|
END_TEST
|
||
|
|
||
|
static Suite *
|
||
|
make_suite(void)
|
||
|
{
|
||
|
Suite *s = suite_create("basic");
|
||
|
TCase *tc_basic = tcase_create("basic tests");
|
||
|
TCase *tc_namespace = tcase_create("XML namespaces");
|
||
|
|
||
|
suite_add_tcase(s, tc_basic);
|
||
|
tcase_add_checked_fixture(tc_basic, basic_setup, basic_teardown);
|
||
|
tcase_add_test(tc_basic, test_nul_byte);
|
||
|
tcase_add_test(tc_basic, test_u0000_char);
|
||
|
tcase_add_test(tc_basic, test_bom_utf8);
|
||
|
tcase_add_test(tc_basic, test_bom_utf16_be);
|
||
|
tcase_add_test(tc_basic, test_bom_utf16_le);
|
||
|
tcase_add_test(tc_basic, test_illegal_utf8);
|
||
|
tcase_add_test(tc_basic, test_utf16);
|
||
|
tcase_add_test(tc_basic, test_utf16_le_epilog_newline);
|
||
|
tcase_add_test(tc_basic, test_latin1_umlauts);
|
||
|
/* Regression test for SF bug #491986. */
|
||
|
tcase_add_test(tc_basic, test_danish_latin1);
|
||
|
/* Regression test for SF bug #514281. */
|
||
|
tcase_add_test(tc_basic, test_french_charref_hexidecimal);
|
||
|
tcase_add_test(tc_basic, test_french_charref_decimal);
|
||
|
tcase_add_test(tc_basic, test_french_latin1);
|
||
|
tcase_add_test(tc_basic, test_french_utf8);
|
||
|
tcase_add_test(tc_basic, test_utf8_false_rejection);
|
||
|
tcase_add_test(tc_basic, test_line_number_after_parse);
|
||
|
tcase_add_test(tc_basic, test_column_number_after_parse);
|
||
|
tcase_add_test(tc_basic, test_line_and_column_numbers_inside_handlers);
|
||
|
tcase_add_test(tc_basic, test_line_number_after_error);
|
||
|
tcase_add_test(tc_basic, test_column_number_after_error);
|
||
|
tcase_add_test(tc_basic, test_really_long_lines);
|
||
|
tcase_add_test(tc_basic, test_end_element_events);
|
||
|
tcase_add_test(tc_basic, test_attr_whitespace_normalization);
|
||
|
tcase_add_test(tc_basic, test_xmldecl_misplaced);
|
||
|
tcase_add_test(tc_basic, test_unknown_encoding_internal_entity);
|
||
|
tcase_add_test(tc_basic,
|
||
|
test_wfc_undeclared_entity_unread_external_subset);
|
||
|
tcase_add_test(tc_basic, test_wfc_undeclared_entity_no_external_subset);
|
||
|
tcase_add_test(tc_basic, test_wfc_undeclared_entity_standalone);
|
||
|
tcase_add_test(tc_basic, test_wfc_undeclared_entity_with_external_subset);
|
||
|
tcase_add_test(tc_basic,
|
||
|
test_wfc_undeclared_entity_with_external_subset_standalone);
|
||
|
tcase_add_test(tc_basic, test_wfc_no_recursive_entity_refs);
|
||
|
tcase_add_test(tc_basic, test_ext_entity_set_encoding);
|
||
|
tcase_add_test(tc_basic, test_dtd_default_handling);
|
||
|
tcase_add_test(tc_basic, test_empty_ns_without_namespaces);
|
||
|
tcase_add_test(tc_basic, test_ns_in_attribute_default_without_namespaces);
|
||
|
tcase_add_test(tc_basic, test_stop_parser_between_char_data_calls);
|
||
|
tcase_add_test(tc_basic, test_suspend_parser_between_char_data_calls);
|
||
|
|
||
|
suite_add_tcase(s, tc_namespace);
|
||
|
tcase_add_checked_fixture(tc_namespace,
|
||
|
namespace_setup, namespace_teardown);
|
||
|
tcase_add_test(tc_namespace, test_return_ns_triplet);
|
||
|
tcase_add_test(tc_namespace, test_ns_tagname_overwrite);
|
||
|
tcase_add_test(tc_namespace, test_ns_tagname_overwrite_triplet);
|
||
|
tcase_add_test(tc_namespace, test_start_ns_clears_start_element);
|
||
|
tcase_add_test(tc_namespace, test_default_ns_from_ext_subset_and_ext_ge);
|
||
|
tcase_add_test(tc_namespace, test_ns_prefix_with_empty_uri_1);
|
||
|
tcase_add_test(tc_namespace, test_ns_prefix_with_empty_uri_2);
|
||
|
tcase_add_test(tc_namespace, test_ns_prefix_with_empty_uri_3);
|
||
|
tcase_add_test(tc_namespace, test_ns_prefix_with_empty_uri_4);
|
||
|
tcase_add_test(tc_namespace, test_ns_default_with_empty_uri);
|
||
|
tcase_add_test(tc_namespace, test_ns_duplicate_attrs_diff_prefixes);
|
||
|
tcase_add_test(tc_namespace, test_ns_unbound_prefix_on_attribute);
|
||
|
tcase_add_test(tc_namespace, test_ns_unbound_prefix_on_element);
|
||
|
|
||
|
return s;
|
||
|
}
|
||
|
|
||
|
|
||
|
int
|
||
|
main(int argc, char *argv[])
|
||
|
{
|
||
|
int i, nf;
|
||
|
int verbosity = CK_NORMAL;
|
||
|
Suite *s = make_suite();
|
||
|
SRunner *sr = srunner_create(s);
|
||
|
|
||
|
/* run the tests for internal helper functions */
|
||
|
testhelper_is_whitespace_normalized();
|
||
|
|
||
|
for (i = 1; i < argc; ++i) {
|
||
|
char *opt = argv[i];
|
||
|
if (strcmp(opt, "-v") == 0 || strcmp(opt, "--verbose") == 0)
|
||
|
verbosity = CK_VERBOSE;
|
||
|
else if (strcmp(opt, "-q") == 0 || strcmp(opt, "--quiet") == 0)
|
||
|
verbosity = CK_SILENT;
|
||
|
else {
|
||
|
fprintf(stderr, "runtests: unknown option '%s'\n", opt);
|
||
|
return 2;
|
||
|
}
|
||
|
}
|
||
|
if (verbosity != CK_SILENT)
|
||
|
printf("Expat version: %s\n", XML_ExpatVersion());
|
||
|
srunner_run_all(sr, verbosity);
|
||
|
nf = srunner_ntests_failed(sr);
|
||
|
srunner_free(sr);
|
||
|
|
||
|
return (nf == 0) ? EXIT_SUCCESS : EXIT_FAILURE;
|
||
|
}
|