libexpat/expat/tests/runtests.c

#include <assert.h>
#include <check.h>
#include <stdlib.h>
#include <stdio.h>
#include <string.h>

#include "expat.h"


static XML_Parser parser;


/* Fixture setup: create a fresh parser in the file-scope `parser`
 * variable and report a test failure if none could be created.
 */
static void
basic_setup(void)
{
    /* No encoding override is given; Expat works out the encoding from
     * each document itself.
     */
    parser = XML_ParserCreate(NULL);
    if (!parser) {
        fail("Parser not created.");
    }
}

/* Fixture teardown: release the parser held in the file-scope `parser`
 * variable, if there is one.
 *
 * The variable is reset to NULL after the free so that no dangling
 * handle is left behind and a repeated teardown is harmless.
 */
static void
basic_teardown(void)
{
    if (parser != NULL) {
        XML_ParserFree(parser);
        parser = NULL;
    }
}

/* Generate a failure using the parser state to create an error message;
 * this should be used when the parser reports an error we weren't
 * expecting.
 *
 * file, line: source location to mention in the message; the
 * xml_failure() macro below passes __FILE__ and __LINE__ of its caller.
 */
static void
_xml_failure(const char *file, int line)
{
    char buffer[1024];

    /* snprintf() bounds the write: neither `file` nor the Expat error
     * text has a fixed maximum length, so an unbounded sprintf() could
     * overrun the buffer.  An over-long message is simply truncated.
     * The explicit int casts keep the arguments matched to "%d"
     * whatever integer type the position accessors return.
     */
    snprintf(buffer, sizeof(buffer),
             "%s (line %d, offset %d)\n    reported from %s, line %d",
             XML_ErrorString(XML_GetErrorCode(parser)),
             (int)XML_GetCurrentLineNumber(parser),
             (int)XML_GetCurrentColumnNumber(parser),
             file, line);
    fail(buffer);
}

#define xml_failure() _xml_failure(__FILE__, __LINE__)

START_TEST(test_nul_byte)
{
    /* Declared as an array so that sizeof() counts the embedded NUL;
     * strlen() would stop at it.  The "- 1" drops the terminator.
     */
    char doc[] = "<doc>\0</doc>";
    int doc_len = sizeof(doc) - 1;

    /* A raw NUL byte inside US-ASCII data must make the parse fail... */
    if (XML_Parse(parser, doc, doc_len, 1) != 0)
        fail("Parser did not report error on NUL-byte.");
    /* ...and the failure must be reported as an invalid token. */
    if (XML_GetErrorCode(parser) != XML_ERROR_INVALID_TOKEN)
        xml_failure();
}
END_TEST


START_TEST(test_u0000_char)
{
    char *doc = "<doc>&#0;</doc>";
    int doc_len = strlen(doc);

    /* A character reference to U+0000 ("&#0;") must make the parse
     * fail...
     */
    if (XML_Parse(parser, doc, doc_len, 1) != 0)
        fail("Parser did not report error on NUL-byte.");
    /* ...and the failure must be reported as a bad character reference. */
    if (XML_GetErrorCode(parser) != XML_ERROR_BAD_CHAR_REF)
        xml_failure();
}
END_TEST


START_TEST(test_xmldecl_misplaced)
{
    /* The XML declaration is preceded by a newline, so it is not the
     * very first thing in the document.
     */
    char *doc =
        "\n"
        "<?xml version='1.0'?>\n"
        "<a>&eee;</a>";
    int doc_len = strlen(doc);

    if (XML_Parse(parser, doc, doc_len, 1)) {
        /* The parse must not succeed. */
        fail("expected XML_ERROR_MISPLACED_XML_PI with misplaced XML decl");
    }
    else if (XML_GetErrorCode(parser) != XML_ERROR_MISPLACED_XML_PI) {
        /* It failed, but for some other reason than the one expected. */
        xml_failure();
    }
}
END_TEST

START_TEST(test_bom_utf8)
{
    /* Bytes EF BB BF (a UTF-8 byte order mark) followed by an empty
     * element.  This is really just making sure the parser does not
     * crash on the BOM and accepts the document.
     */
    char *doc = "\357\273\277<e/>";
    int doc_len = strlen(doc);

    if (XML_Parse(parser, doc, doc_len, 1) == 0)
        xml_failure();
}
END_TEST

START_TEST(test_bom_utf16_be)
{
    /* Bytes FE FF, then "<e/>" with a zero byte in front of each
     * character.  An array is used so that sizeof() sees the embedded
     * zero bytes; the "- 1" drops the literal's own terminator.
     */
    char doc[] = "\376\377\0<\0e\0/\0>";
    int doc_len = sizeof(doc) - 1;

    if (XML_Parse(parser, doc, doc_len, 1) == 0)
        xml_failure();
}
END_TEST

START_TEST(test_bom_utf16_le)
{
    /* Bytes FF FE, then "<e/>" with a zero byte after each character.
     * An array is used so that sizeof() sees the embedded zero bytes;
     * the "- 1" drops the literal's own terminator.
     */
    char doc[] = "\377\376<\0e\0/\0>\0";
    int doc_len = sizeof(doc) - 1;

    if (XML_Parse(parser, doc, doc_len, 1) == 0)
        xml_failure();
}
END_TEST


/* Accumulator for the character data reported while parsing one
 * document; filled by accumulate_characters() and inspected by
 * check_characters().
 */
typedef struct 
{
    int count;              /* number of characters stored in data so far */
    XML_Char data[1024];    /* the characters themselves; the code that
                             * fills this never writes a terminator */
} CharData;

/* Character data handler: append the `len` characters at `s` to the
 * CharData passed as `userData`.
 *
 * A chunk is stored only if it leaves at least one element of
 * storage->data unused; otherwise the whole chunk is dropped and the
 * count is left unchanged (check_characters() then sees a count
 * mismatch).
 */
static void
accumulate_characters(void *userData, const XML_Char *s, int len)
{
    CharData *storage = (CharData *)userData;
    /* Capacity in XML_Char elements rather than bytes: storage->count
     * and the pointer arithmetic below are both element-based, so the
     * bound must be too.
     */
    const int capacity =
        (int)(sizeof(storage->data) / sizeof(storage->data[0]));

    /* Written as a subtraction so the sum cannot overflow, and with an
     * explicit len >= 0 test instead of relying on signed-to-unsigned
     * conversion to reject a negative length.
     */
    if (len >= 0 && len < capacity - storage->count) {
        /* memcpy() counts bytes, so scale by the element size. */
        memcpy(storage->data + storage->count, s,
               (size_t)len * sizeof(storage->data[0]));
        storage->count += len;
    }
}

/* Compare the accumulated character data with the NUL-terminated
 * `expected` string: first the lengths, then the bytes.  Any mismatch
 * is reported through fail().
 */
static void
check_characters(CharData *storage, XML_Char *expected)
{
    char message[1024];
    int expected_len = strlen(expected);

    if (storage->count == expected_len) {
        /* Same length, so the contents can be compared directly. */
        if (memcmp(expected, storage->data, expected_len) != 0)
            fail("got bad data bytes");
        return;
    }

    sprintf(message, "wrong number of data characters: got %d, expected %d",
            storage->count, expected_len);
    fail(message);
}

/* Parse `text` as a complete document, collecting every piece of
 * character data that is reported, then check that the collected data
 * equals `expected`.
 */
static void
run_character_check(XML_Char *text, XML_Char *expected)
{
    CharData collected;
    int text_len = strlen(text);

    collected.count = 0;
    XML_SetCharacterDataHandler(parser, accumulate_characters);
    XML_SetUserData(parser, &collected);

    if (XML_Parse(parser, text, text_len, 1) == 0)
        xml_failure();
    check_characters(&collected, expected);
}

/* Regression test for SF bug #491986. */
START_TEST(test_danish_latin1)
{
    /* The element content is "J", o-slash, "rgen ", then ae, o-slash,
     * a-ring and their capitals AE, O-slash, A-ring, as ISO-8859-1
     * bytes.  They are spelled as hex escapes so that this source file
     * stays pure ASCII and the test data cannot be damaged by an editor
     * or an encoding conversion.  The expected string passed below is
     * the same text encoded as UTF-8.
     */
    char *text =
        "<?xml version='1.0' encoding='iso-8859-1'?>\n"
        "<e>J\xF8rgen \xE6\xF8\xE5\xC6\xD8\xC5</e>";
    run_character_check(text,
             "J\xC3\xB8rgen \xC3\xA6\xC3\xB8\xC3\xA5\xC3\x86\xC3\x98\xC3\x85");
}
END_TEST
/* End regression test for SF bug #491986. */


/* Regression test for SF bug #514281. */
START_TEST(test_french_charref_hexidecimal)
{
    /* Code points E9, E8, E0, E7, EA and C8, given as hexadecimal
     * character references in a document declared as ISO-8859-1.
     */
    char *document =
        "<?xml version='1.0' encoding='iso-8859-1'?>\n"
        "<doc>&#xE9;&#xE8;&#xE0;&#xE7;&#xEA;&#xC8;</doc>";
    /* The same six characters, encoded as UTF-8. */
    char *expected_utf8 =
        "\xC3\xA9\xC3\xA8\xC3\xA0\xC3\xA7\xC3\xAA\xC3\x88";

    run_character_check(document, expected_utf8);
}
END_TEST

START_TEST(test_french_charref_decimal)
{
    /* Code points 233, 232, 224, 231, 234 and 200, given as decimal
     * character references in a document declared as ISO-8859-1.
     */
    char *document =
        "<?xml version='1.0' encoding='iso-8859-1'?>\n"
        "<doc>&#233;&#232;&#224;&#231;&#234;&#200;</doc>";
    /* The same six characters, encoded as UTF-8. */
    char *expected_utf8 =
        "\xC3\xA9\xC3\xA8\xC3\xA0\xC3\xA7\xC3\xAA\xC3\x88";

    run_character_check(document, expected_utf8);
}
END_TEST

START_TEST(test_french_latin1)
{
    /* Bytes E9, E8, E0, E7, EA and C8 placed directly in the content of
     * a document declared as ISO-8859-1.
     */
    char *document =
        "<?xml version='1.0' encoding='iso-8859-1'?>\n"
        "<doc>\xE9\xE8\xE0\xE7\xEa\xC8</doc>";
    /* The same six characters, encoded as UTF-8. */
    char *expected_utf8 =
        "\xC3\xA9\xC3\xA8\xC3\xA0\xC3\xA7\xC3\xAA\xC3\x88";

    run_character_check(document, expected_utf8);
}
END_TEST

START_TEST(test_french_utf8)
{
    /* The two-byte sequence C3 A9 in a document declared as UTF-8 must
     * be reported as the same two bytes.
     */
    char *document =
        "<?xml version='1.0' encoding='utf-8'?>\n"
        "<doc>\xC3\xA9</doc>";
    char *expected_utf8 = "\xC3\xA9";

    run_character_check(document, expected_utf8);
}
END_TEST
/* End regression test for SF bug #514281. */


/* Helpers used by the following test; these check any "attr", "ents" and
 * "refs" attributes to make sure whitespace has been normalized.
 */

/* Report whether the string `s` looks like an attribute value whose
 * whitespace has already been normalized.
 *
 * Returns 1 if it does and 0 if it does not.  A tab, line feed or
 * carriage return anywhere in the string always gives 0.  When
 * `is_cdata` is zero the string must in addition have no leading
 * space, no trailing space and no run of more than one space; CDATA
 * attributes are exempt from that collapsing.  (Section 3.3.3 of the
 * recommendation.)
 */
static int
is_whitespace_normalized(const XML_Char *s, int is_cdata)
{
    const XML_Char *p;
    int pending_spaces = 0;  /* spaces seen since the last other character */
    int seen_text = 0;       /* set once a non-space character was seen */

    for (p = s; *p; ++p) {
        switch (*p) {
        case ' ':
            ++pending_spaces;
            break;
        case '\t':
        case '\n':
        case '\r':
            return 0;
        default:
            if (!is_cdata) {
                /* illegal leading blanks */
                if (!seen_text && pending_spaces)
                    return 0;
                /* a run of blanks that was not collapsed */
                if (seen_text && pending_spaces > 1)
                    return 0;
            }
            seen_text = 1;
            pending_spaces = 0;
            break;
        }
    }
    /* Spaces still pending here are trailing blanks (or the string
     * consisted of nothing but spaces).
     */
    return (is_cdata || !pending_spaces) ? 1 : 0;
}

/* Self-check of is_whitespace_normalized().  Plain assert() is used
 * here instead of the test framework, since this exercises a helper of
 * the test suite rather than Expat.
 */
static void
testhelper_is_whitespace_normalized(void)
{
    /* Single-spaced text without leading or trailing blanks is
     * normalized whatever the attribute type.
     */
    assert(is_whitespace_normalized("abc", 0));
    assert(is_whitespace_normalized("abc", 1));
    assert(is_whitespace_normalized("abc def ghi", 0));
    assert(is_whitespace_normalized("abc def ghi", 1));

    /* Leading, doubled, trailing or lone spaces are acceptable in a
     * CDATA attribute...
     */
    assert(is_whitespace_normalized(" abc def ghi", 1));
    assert(is_whitespace_normalized("abc  def ghi", 1));
    assert(is_whitespace_normalized("abc def ghi ", 1));
    assert(is_whitespace_normalized(" ", 1));

    /* ...but not in any other attribute type. */
    assert(!is_whitespace_normalized(" abc def ghi", 0));
    assert(!is_whitespace_normalized("abc  def ghi", 0));
    assert(!is_whitespace_normalized("abc def ghi ", 0));
    assert(!is_whitespace_normalized(" ", 0));

    /* Tab, line feed and carriage return are never acceptable. */
    assert(!is_whitespace_normalized("\t", 0));
    assert(!is_whitespace_normalized("\t", 1));
    assert(!is_whitespace_normalized("\n", 0));
    assert(!is_whitespace_normalized("\n", 1));
    assert(!is_whitespace_normalized("\r", 0));
    assert(!is_whitespace_normalized("\r", 1));
    assert(!is_whitespace_normalized("abc\t def", 1));
}

/* Start-element handler: fail the running test if an attribute named
 * "attr", "ents" or "refs" has a value whose whitespace has not been
 * normalized according to the non-CDATA rules.
 *
 * userdata, name: unused.
 * atts: NULL-terminated array of alternating attribute names and
 *       values.
 */
static void
check_attr_contains_normalized_whitespace(void *userdata,
                                          const XML_Char *name,
                                          const XML_Char **atts)
{
    int i;

    (void)userdata;
    (void)name;

    for (i = 0; atts[i] != NULL; i += 2) {
        const XML_Char *attrname = atts[i];
        const XML_Char *value = atts[i + 1];
        if (strcmp("attr", attrname) == 0
            || strcmp("ents", attrname) == 0
            || strcmp("refs", attrname) == 0) {
            if (!is_whitespace_normalized(value, 0)) {
                char buffer[256];
                /* The value comes from the document and has no length
                 * limit, so the write is bounded; an over-long message
                 * is truncated rather than overrunning the buffer.
                 */
                snprintf(buffer, sizeof(buffer),
                         "attribute value not normalized: %s='%s'",
                         attrname, value);
                fail(buffer);
            }
        }
    }
}

START_TEST(test_attr_whitespace_normalization)
{
    /* The internal subset declares three tokenized attributes on <doc>;
     * the start tag then supplies values padded with extra spaces, tabs
     * and line breaks.  The start-element handler inspects the values
     * that are reported for them.
     */
    char *document =
        "<!DOCTYPE doc [\n"
        "  <!ATTLIST doc\n"
        "            attr NMTOKENS #REQUIRED\n"
        "            ents ENTITIES #REQUIRED\n"
        "            refs IDREFS   #REQUIRED>\n"
        "]>\n"
        "<doc attr='    a  b c\t\td\te\t' refs=' id-1   \t  id-2\t\t'  \n"
        "     ents=' ent-1   \t\r\n"
        "            ent-2  ' >\n"
        "  <e id='id-1'/>\n"
        "  <e id='id-2'/>\n"
        "</doc>";
    int document_len = strlen(document);

    XML_SetStartElementHandler(parser,
                               check_attr_contains_normalized_whitespace);
    if (XML_Parse(parser, document, document_len, 1) == 0)
        xml_failure();
}
END_TEST


/* Build the "basic" suite: three test cases, each using the
 * basic_setup()/basic_teardown() fixture pair.  Returns the new suite.
 */
static Suite *
make_basic_suite(void)
{
    Suite *suite = suite_create("basic");
    TCase *chars_case = tcase_create("character tests");
    TCase *attrs_case = tcase_create("attributes");
    TCase *xmldecl_case = tcase_create("XML declaration");

    /* Character-level tests: NUL handling, byte order marks and
     * encoding conversion.
     */
    suite_add_tcase(suite, chars_case);
    tcase_add_checked_fixture(chars_case, basic_setup, basic_teardown);
    tcase_add_test(chars_case, test_nul_byte);
    tcase_add_test(chars_case, test_u0000_char);
    tcase_add_test(chars_case, test_bom_utf8);
    tcase_add_test(chars_case, test_bom_utf16_be);
    tcase_add_test(chars_case, test_bom_utf16_le);
    /* Regression test for SF bug #491986. */
    tcase_add_test(chars_case, test_danish_latin1);
    /* Regression test for SF bug #514281. */
    tcase_add_test(chars_case, test_french_charref_hexidecimal);
    tcase_add_test(chars_case, test_french_charref_decimal);
    tcase_add_test(chars_case, test_french_latin1);
    tcase_add_test(chars_case, test_french_utf8);

    /* Attribute value handling. */
    suite_add_tcase(suite, attrs_case);
    tcase_add_checked_fixture(attrs_case, basic_setup, basic_teardown);
    tcase_add_test(attrs_case, test_attr_whitespace_normalization);

    /* Placement of the XML declaration. */
    suite_add_tcase(suite, xmldecl_case);
    tcase_add_checked_fixture(xmldecl_case, basic_setup, basic_teardown);
    tcase_add_test(xmldecl_case, test_xmldecl_misplaced);

    return suite;
}


/* Test driver.
 *
 * Options: -v/--verbose, -q/--quiet, -f/--fork, -n/--no-fork.  An
 * unknown option prints a message to stderr and exits with status 2.
 * Otherwise the exit status is EXIT_SUCCESS when no test failed and
 * EXIT_FAILURE when at least one did.
 */
int
main(int argc, char *argv[])
{
    int arg_index;
    int failed_count;
    int fork_requested = 0;
    int fork_option_seen = 0;
    int verbosity = CK_NORMAL;
    Suite *suite = make_basic_suite();
    SRunner *runner = srunner_create(suite);

    /* run the tests for internal helper functions */
    testhelper_is_whitespace_normalized();

    for (arg_index = 1; arg_index < argc; ++arg_index) {
        char *opt = argv[arg_index];

        if (!strcmp(opt, "-v") || !strcmp(opt, "--verbose")) {
            verbosity = CK_VERBOSE;
            continue;
        }
        if (!strcmp(opt, "-q") || !strcmp(opt, "--quiet")) {
            verbosity = CK_SILENT;
            continue;
        }
        if (!strcmp(opt, "-f") || !strcmp(opt, "--fork")) {
            fork_requested = 1;
            fork_option_seen = 1;
            continue;
        }
        if (!strcmp(opt, "-n") || !strcmp(opt, "--no-fork")) {
            fork_requested = 0;
            fork_option_seen = 1;
            continue;
        }
        fprintf(stderr, "runtests: unknown option '%s'\n", opt);
        return 2;
    }

    /* The runner's fork mode is only touched when the user asked for
     * one explicitly.
     */
    if (fork_option_seen) {
        if (fork_requested)
            srunner_set_fork_status(runner, CK_FORK);
        else
            srunner_set_fork_status(runner, CK_NOFORK);
    }

    srunner_run_all(runner, verbosity);
    failed_count = srunner_ntests_failed(runner);
    srunner_free(runner);
    suite_free(suite);

    if (failed_count != 0)
        return EXIT_FAILURE;
    return EXIT_SUCCESS;
}
-												Added a test to make sure that whitespace in ENTITIES, IDREFS, and NMTOKENS
attributes is properly collapsed according to Section 3.3.3 of the spec.
This is the first even slightly complicated test; boy are these painful in
C!  Had to add a test of a helper routine as well; that just uses assertions
since the test framework should not be dealing with tests of the tester,
just of Expat.

Added a helper to make the failure messages more useful when Expat produces
an unexpected error code; we now include the error message and location from
Expat.  This is mostly useful when developing a new test.

											
										
										
											2001-11-16 15:19:39 -05:00
+								#include <assert.h>
-A very small test suite for Expat; additional tests will be added as time
permits.

											
										
										
											2001-08-17 15:16:41 -04:00
+								#include <check.h>
 								#include <stdlib.h>
-												Added a test to make sure that whitespace in ENTITIES, IDREFS, and NMTOKENS
attributes is properly collapsed according to Section 3.3.3 of the spec.
This is the first even slightly complicated test; boy are these painful in
C!  Had to add a test of a helper routine as well; that just uses assertions
since the test framework should not be dealing with tests of the tester,
just of Expat.

Added a helper to make the failure messages more useful when Expat produces
an unexpected error code; we now include the error message and location from
Expat.  This is mostly useful when developing a new test.

											
										
										
											2001-11-16 15:19:39 -05:00
+								#include <stdio.h>
-												basic_setup():  Remove bogus assumption that all tests would use US-ASCII
    data; let Expat determine the proper encoding from the XML source text.

Added several tests relating to supposed mis-interpretation of Latin-1;
these show that Expat (at least in the CVS version) is properly decoding
the Latin-1 text and generating the proper UTF-8 output.

This closes SF bug #491986, #514281.

											
										
										
											2002-04-19 14:25:07 -04:00
+								#include <string.h>
-A very small test suite for Expat; additional tests will be added as time
permits.

											
										
										
											2001-08-17 15:16:41 -04:00
 								#include "expat.h"
 								static XML_Parser parser;
 								static void
 								basic_setup(void)
 								{
-												basic_setup():  Remove bogus assumption that all tests would use US-ASCII
    data; let Expat determine the proper encoding from the XML source text.

Added several tests relating to supposed mis-interpretation of Latin-1;
these show that Expat (at least in the CVS version) is properly decoding
the Latin-1 text and generating the proper UTF-8 output.

This closes SF bug #491986, #514281.

											
										
										
											2002-04-19 14:25:07 -04:00
+								    parser = XML_ParserCreate(NULL);
-												Update to work with check 0.8.

											
										
										
											2001-11-13 00:04:02 -05:00
+								    if (parser == NULL)
 								        fail("Parser not created.");
-A very small test suite for Expat; additional tests will be added as time
permits.

											
										
										
											2001-08-17 15:16:41 -04:00
+								}
 								static void
 								basic_teardown(void)
 								{
-												Added a test to make sure that whitespace in ENTITIES, IDREFS, and NMTOKENS
attributes is properly collapsed according to Section 3.3.3 of the spec.
This is the first even slightly complicated test; boy are these painful in
C!  Had to add a test of a helper routine as well; that just uses assertions
since the test framework should not be dealing with tests of the tester,
just of Expat.

Added a helper to make the failure messages more useful when Expat produces
an unexpected error code; we now include the error message and location from
Expat.  This is mostly useful when developing a new test.

											
										
										
											2001-11-16 15:19:39 -05:00
+								    if (parser != NULL)
-A very small test suite for Expat; additional tests will be added as time
permits.

											
										
										
											2001-08-17 15:16:41 -04:00
+								        XML_ParserFree(parser);
 								}
-												Added a test to make sure that whitespace in ENTITIES, IDREFS, and NMTOKENS
attributes is properly collapsed according to Section 3.3.3 of the spec.
This is the first even slightly complicated test; boy are these painful in
C!  Had to add a test of a helper routine as well; that just uses assertions
since the test framework should not be dealing with tests of the tester,
just of Expat.

Added a helper to make the failure messages more useful when Expat produces
an unexpected error code; we now include the error message and location from
Expat.  This is mostly useful when developing a new test.

											
										
										
											2001-11-16 15:19:39 -05:00
+								/* Generate a failure using the parser state to create an error message;
 								 * this should be used when the parser reports and error we weren't
 								 * expecting.
 								 */
 								static void
-												basic_setup():  Remove bogus assumption that all tests would use US-ASCII
    data; let Expat determine the proper encoding from the XML source text.

Added several tests relating to supposed mis-interpretation of Latin-1;
these show that Expat (at least in the CVS version) is properly decoding
the Latin-1 text and generating the proper UTF-8 output.

This closes SF bug #491986, #514281.

											
										
										
											2002-04-19 14:25:07 -04:00
+								_xml_failure(const char *file, int line)
-												Added a test to make sure that whitespace in ENTITIES, IDREFS, and NMTOKENS
attributes is properly collapsed according to Section 3.3.3 of the spec.
This is the first even slightly complicated test; boy are these painful in
C!  Had to add a test of a helper routine as well; that just uses assertions
since the test framework should not be dealing with tests of the tester,
just of Expat.

Added a helper to make the failure messages more useful when Expat produces
an unexpected error code; we now include the error message and location from
Expat.  This is mostly useful when developing a new test.

											
										
										
											2001-11-16 15:19:39 -05:00
+								{
-												basic_setup():  Remove bogus assumption that all tests would use US-ASCII
    data; let Expat determine the proper encoding from the XML source text.

Added several tests relating to supposed mis-interpretation of Latin-1;
these show that Expat (at least in the CVS version) is properly decoding
the Latin-1 text and generating the proper UTF-8 output.

This closes SF bug #491986, #514281.

											
										
										
											2002-04-19 14:25:07 -04:00
+								    char buffer[1024];
 								    sprintf(buffer, "%s (line %d, offset %d)\n    reported from %s, line %d",
-												Added a test to make sure that whitespace in ENTITIES, IDREFS, and NMTOKENS
attributes is properly collapsed according to Section 3.3.3 of the spec.
This is the first even slightly complicated test; boy are these painful in
C!  Had to add a test of a helper routine as well; that just uses assertions
since the test framework should not be dealing with tests of the tester,
just of Expat.

Added a helper to make the failure messages more useful when Expat produces
an unexpected error code; we now include the error message and location from
Expat.  This is mostly useful when developing a new test.

											
										
										
											2001-11-16 15:19:39 -05:00
+								            XML_ErrorString(XML_GetErrorCode(parser)),
 								            XML_GetCurrentLineNumber(parser),
-												basic_setup():  Remove bogus assumption that all tests would use US-ASCII
    data; let Expat determine the proper encoding from the XML source text.

Added several tests relating to supposed mis-interpretation of Latin-1;
these show that Expat (at least in the CVS version) is properly decoding
the Latin-1 text and generating the proper UTF-8 output.

This closes SF bug #491986, #514281.

											
										
										
											2002-04-19 14:25:07 -04:00
+								            XML_GetCurrentColumnNumber(parser),
 								            file, line);
-												Added a test to make sure that whitespace in ENTITIES, IDREFS, and NMTOKENS
attributes is properly collapsed according to Section 3.3.3 of the spec.
This is the first even slightly complicated test; boy are these painful in
C!  Had to add a test of a helper routine as well; that just uses assertions
since the test framework should not be dealing with tests of the tester,
just of Expat.

Added a helper to make the failure messages more useful when Expat produces
an unexpected error code; we now include the error message and location from
Expat.  This is mostly useful when developing a new test.

											
										
										
											2001-11-16 15:19:39 -05:00
+								    fail(buffer);
 								}
-A very small test suite for Expat; additional tests will be added as time
permits.

											
										
										
											2001-08-17 15:16:41 -04:00
-												basic_setup():  Remove bogus assumption that all tests would use US-ASCII
    data; let Expat determine the proper encoding from the XML source text.

Added several tests relating to supposed mis-interpretation of Latin-1;
these show that Expat (at least in the CVS version) is properly decoding
the Latin-1 text and generating the proper UTF-8 output.

This closes SF bug #491986, #514281.

											
										
										
											2002-04-19 14:25:07 -04:00
+								#define xml_failure() _xml_failure(__FILE__, __LINE__)
-A very small test suite for Expat; additional tests will be added as time
permits.

											
										
										
											2001-08-17 15:16:41 -04:00
+								START_TEST(test_nul_byte)
 								{
-												Added a test to make sure that whitespace in ENTITIES, IDREFS, and NMTOKENS
attributes is properly collapsed according to Section 3.3.3 of the spec.
This is the first even slightly complicated test; boy are these painful in
C!  Had to add a test of a helper routine as well; that just uses assertions
since the test framework should not be dealing with tests of the tester,
just of Expat.

Added a helper to make the failure messages more useful when Expat produces
an unexpected error code; we now include the error message and location from
Expat.  This is mostly useful when developing a new test.

											
										
										
											2001-11-16 15:19:39 -05:00
+								    char text[] = "<doc>\0</doc>";
-A very small test suite for Expat; additional tests will be added as time
permits.

											
										
										
											2001-08-17 15:16:41 -04:00
 								    /* test that a NUL byte (in US-ASCII data) is an error */
-												Added a test to make sure that whitespace in ENTITIES, IDREFS, and NMTOKENS
attributes is properly collapsed according to Section 3.3.3 of the spec.
This is the first even slightly complicated test; boy are these painful in
C!  Had to add a test of a helper routine as well; that just uses assertions
since the test framework should not be dealing with tests of the tester,
just of Expat.

Added a helper to make the failure messages more useful when Expat produces
an unexpected error code; we now include the error message and location from
Expat.  This is mostly useful when developing a new test.

											
										
										
											2001-11-16 15:19:39 -05:00
+								    if (XML_Parse(parser, text, sizeof(text) - 1, 1))
-A very small test suite for Expat; additional tests will be added as time
permits.

											
										
										
											2001-08-17 15:16:41 -04:00
+								        fail("Parser did not report error on NUL-byte.");
-												Added a test to make sure that whitespace in ENTITIES, IDREFS, and NMTOKENS
attributes is properly collapsed according to Section 3.3.3 of the spec.
This is the first even slightly complicated test; boy are these painful in
C!  Had to add a test of a helper routine as well; that just uses assertions
since the test framework should not be dealing with tests of the tester,
just of Expat.

Added a helper to make the failure messages more useful when Expat produces
an unexpected error code; we now include the error message and location from
Expat.  This is mostly useful when developing a new test.

											
										
										
											2001-11-16 15:19:39 -05:00
+								    if (XML_GetErrorCode(parser) != XML_ERROR_INVALID_TOKEN)
 								        xml_failure();
-A very small test suite for Expat; additional tests will be added as time
permits.

											
										
										
											2001-08-17 15:16:41 -04:00
+								}
 								END_TEST
 								START_TEST(test_u0000_char)
 								{
 								    char *text = "<doc>&#0;</doc>";
 								    /* test that a NUL byte (in US-ASCII data) is an error */
 								    if (XML_Parse(parser, text, strlen(text), 1))
 								        fail("Parser did not report error on NUL-byte.");
-												Added a test to make sure that whitespace in ENTITIES, IDREFS, and NMTOKENS
attributes is properly collapsed according to Section 3.3.3 of the spec.
This is the first even slightly complicated test; boy are these painful in
C!  Had to add a test of a helper routine as well; that just uses assertions
since the test framework should not be dealing with tests of the tester,
just of Expat.

Added a helper to make the failure messages more useful when Expat produces
an unexpected error code; we now include the error message and location from
Expat.  This is mostly useful when developing a new test.

											
										
										
											2001-11-16 15:19:39 -05:00
+								    if (XML_GetErrorCode(parser) != XML_ERROR_BAD_CHAR_REF)
 								        xml_failure();
-A very small test suite for Expat; additional tests will be added as time
permits.

											
										
										
											2001-08-17 15:16:41 -04:00
+								}
 								END_TEST
-												Added a test that ensures the parser reports an out-of-place XML declaration.
(Originally written to attempt to tickle a different bug, but useful as a
regression test even though Expat has been doing the right thing.)

											
										
										
											2001-11-12 23:49:52 -05:00
+								START_TEST(test_xmldecl_misplaced)
 								{
 								    char *text =
 								        "\n"
 								        "<?xml version='1.0'?>\n"
 								        "<a>&eee;</a>";
 								    if (!XML_Parse(parser, text, strlen(text), 1)) {
-												Added a test to make sure that whitespace in ENTITIES, IDREFS, and NMTOKENS
attributes is properly collapsed according to Section 3.3.3 of the spec.
This is the first even slightly complicated test; boy are these painful in
C!  Had to add a test of a helper routine as well; that just uses assertions
since the test framework should not be dealing with tests of the tester,
just of Expat.

Added a helper to make the failure messages more useful when Expat produces
an unexpected error code; we now include the error message and location from
Expat.  This is mostly useful when developing a new test.

											
										
										
											2001-11-16 15:19:39 -05:00
+								        if (XML_GetErrorCode(parser) != XML_ERROR_MISPLACED_XML_PI)
 								            xml_failure();
-												Added a test that ensures the parser reports an out-of-place XML declaration.
(Originally written to attempt to tickle a different bug, but useful as a
regression test even though Expat has been doing the right thing.)

											
										
										
											2001-11-12 23:49:52 -05:00
+								    }
 								    else {
 								        fail("expected XML_ERROR_MISPLACED_XML_PI with misplaced XML decl");
 								    }
 								}
 								END_TEST
-												Added tests that some basic encodings are recognized and the corresponding
BOM marks do not cause core dumps.  The UTF-8 BOM bug was fixed a while ago,
but a regression test is always a good idea.

											
										
										
											2001-11-13 12:31:53 -05:00
+								START_TEST(test_bom_utf8)
 								{
 								    /* This test is really just making sure we don't core on a UTF-8 BOM. */
 								    char *text = "\357\273\277<e/>";
 								    if (!XML_Parse(parser, text, strlen(text), 1))
-												Added a test to make sure that whitespace in ENTITIES, IDREFS, and NMTOKENS
attributes is properly collapsed according to Section 3.3.3 of the spec.
This is the first even slightly complicated test; boy are these painful in
C!  Had to add a test of a helper routine as well; that just uses assertions
since the test framework should not be dealing with tests of the tester,
just of Expat.

Added a helper to make the failure messages more useful when Expat produces
an unexpected error code; we now include the error message and location from
Expat.  This is mostly useful when developing a new test.

											
										
										
											2001-11-16 15:19:39 -05:00
+								        xml_failure();
-												Added tests that some basic encodings are recognized and the corresponding
BOM marks do not cause core dumps.  The UTF-8 BOM bug was fixed a while ago,
but a regression test is always a good idea.

											
										
										
											2001-11-13 12:31:53 -05:00
+								}
 								END_TEST
 								START_TEST(test_bom_utf16_be)
 								{
 								    char text[] = "\376\377\0<\0e\0/\0>";
 								    if (!XML_Parse(parser, text, sizeof(text) - 1, 1))
-												Added a test to make sure that whitespace in ENTITIES, IDREFS, and NMTOKENS
attributes is properly collapsed according to Section 3.3.3 of the spec.
This is the first even slightly complicated test; boy are these painful in
C!  Had to add a test of a helper routine as well; that just uses assertions
since the test framework should not be dealing with tests of the tester,
just of Expat.

Added a helper to make the failure messages more useful when Expat produces
an unexpected error code; we now include the error message and location from
Expat.  This is mostly useful when developing a new test.

											
										
										
											2001-11-16 15:19:39 -05:00
+								        xml_failure();
-												Added tests that some basic encodings are recognized and the corresponding
BOM marks do not cause core dumps.  The UTF-8 BOM bug was fixed a while ago,
but a regression test is always a good idea.

											
										
										
											2001-11-13 12:31:53 -05:00
+								}
 								END_TEST
 								START_TEST(test_bom_utf16_le)
 								{
 								    char text[] = "\377\376<\0e\0/\0>\0";
 								    if (!XML_Parse(parser, text, sizeof(text) - 1, 1))
-												Added a test to make sure that whitespace in ENTITIES, IDREFS, and NMTOKENS
attributes is properly collapsed according to Section 3.3.3 of the spec.
This is the first even slightly complicated test; boy are these painful in
C!  Had to add a test of a helper routine as well; that just uses assertions
since the test framework should not be dealing with tests of the tester,
just of Expat.

Added a helper to make the failure messages more useful when Expat produces
an unexpected error code; we now include the error message and location from
Expat.  This is mostly useful when developing a new test.

											
										
										
											2001-11-16 15:19:39 -05:00
+								        xml_failure();
-												Added tests that some basic encodings are recognized and the corresponding
BOM marks do not cause core dumps.  The UTF-8 BOM bug was fixed a while ago,
but a regression test is always a good idea.

											
										
										
											2001-11-13 12:31:53 -05:00
+								}
 								END_TEST
-												Added a test that ensures the parser reports an out-of-place XML declaration.
(Originally written to attempt to tickle a different bug, but useful as a
regression test even though Expat has been doing the right thing.)

											
										
										
											2001-11-12 23:49:52 -05:00
-												Added a test to make sure that whitespace in ENTITIES, IDREFS, and NMTOKENS
attributes is properly collapsed according to Section 3.3.3 of the spec.
This is the first even slightly complicated test; boy are these painful in
C!  Had to add a test of a helper routine as well; that just uses assertions
since the test framework should not be dealing with tests of the tester,
just of Expat.

Added a helper to make the failure messages more useful when Expat produces
an unexpected error code; we now include the error message and location from
Expat.  This is mostly useful when developing a new test.

											
										
										
											2001-11-16 15:19:39 -05:00
-												basic_setup():  Remove bogus assumption that all tests would use US-ASCII
    data; let Expat determine the proper encoding from the XML source text.

Added several tests relating to supposed mis-interpretation of Latin-1;
these show that Expat (at least in the CVS version) is properly decoding
the Latin-1 text and generating the proper UTF-8 output.

This closes SF bug #491986, #514281.

											
										
										
											2002-04-19 14:25:07 -04:00
 								/* Fixed-size accumulator for the character data reported while parsing
 								 * a test document; filled by accumulate_characters() and inspected by
 								 * check_characters().
 								 */
+								typedef struct
 								{
 								    /* number of characters currently stored in data */
 								    int count;
 								    /* the collected characters; not NUL-terminated */
 								    XML_Char data[1024];
 								} CharData;
 								/* Character data handler: append the 'len' characters starting at 's'
 								 * to the CharData accumulator passed as 'userData'.  A chunk that does
 								 * not fit in the remaining space is dropped as a whole; the resulting
 								 * length mismatch is then reported by check_characters().
 								 */
 								static void
 								accumulate_characters(void *userData, const XML_Char *s, int len)
 								{
 								    CharData *storage = (CharData *)userData;
 								    /* Capacity counted in XML_Char units rather than bytes, so the
 								     * bound stays correct when XML_Char is wider than one byte.
 								     */
 								    const int capacity =
 								        (int)(sizeof(storage->data) / sizeof(storage->data[0]));
 								    /* nothing to store; also keeps a bogus negative length away
 								     * from memcpy()
 								     */
 								    if (len <= 0)
 								        return;
 								    /* written as a subtraction so the test cannot overflow an int */
 								    if (len < capacity - storage->count) {
 								        memcpy(storage->data + storage->count, s,
 								               (size_t)len * sizeof(storage->data[0]));
 								        storage->count += len;
 								    }
 								}
 								/* Fail the current test unless the accumulated character data in
 								 * 'storage' has the same length and the same bytes as the
 								 * NUL-terminated string 'expected'.
 								 */
 								static void
 								check_characters(CharData *storage, XML_Char *expected)
 								{
 								    char message[1024];
 								    int expected_len = strlen(expected);
 								    if (expected_len == storage->count) {
 								        /* lengths agree, so the contents decide */
 								        if (memcmp(expected, storage->data, expected_len) != 0)
 								            fail("got bad data bytes");
 								        return;
 								    }
 								    sprintf(message, "wrong number of data characters: got %d, expected %d",
 								            storage->count, expected_len);
 								    fail(message);
 								}
 								/* Parse 'text' as a complete document with the shared parser while
 								 * collecting every piece of character data, then compare what was
 								 * collected against 'expected'.
 								 */
 								static void
 								run_character_check(XML_Char *text, XML_Char *expected)
 								{
 								    CharData collected;
 								    collected.count = 0;
 								    XML_SetCharacterDataHandler(parser, accumulate_characters);
 								    XML_SetUserData(parser, &collected);
 								    /* a zero result from XML_Parse() means the parse failed */
 								    if (XML_Parse(parser, text, strlen(text), 1) == 0)
 								        xml_failure();
 								    check_characters(&collected, expected);
 								}
 								/* Regression test for SF bug #491986. */
 								START_TEST(test_danish_latin1)
 								{
 								    /* The element content is ISO-8859-1 text whose non-ASCII bytes are
 								     * F8 (o-slash), E6 (ae), F8, E5 (a-ring), C6 (AE), D8 (O-slash)
 								     * and C5 (A-ring).  They are spelled as hex escapes so that the
 								     * source file stays pure ASCII and cannot be damaged by a
 								     * character-set conversion; the second string is the same text
 								     * encoded as UTF-8.
 								     */
 								    char *text =
 								        "<?xml version='1.0' encoding='iso-8859-1'?>\n"
 								        "<e>J\xF8rgen \xE6\xF8\xE5\xC6\xD8\xC5</e>";
 								    run_character_check(text,
 								             "J\xC3\xB8rgen \xC3\xA6\xC3\xB8\xC3\xA5\xC3\x86\xC3\x98\xC3\x85");
 								}
 								END_TEST
 								/* End regression test for SF bug #491986. */
 								/* Regression test for SF bug #514281. */
 								START_TEST(test_french_charref_hexidecimal)
 								{
 								    /* hexadecimal character references inside a Latin-1 document */
 								    char *document =
 								        "<?xml version='1.0' encoding='iso-8859-1'?>\n"
 								        "<doc>&#xE9;&#xE8;&#xE0;&#xE7;&#xEA;&#xC8;</doc>";
 								    /* UTF-8 for U+00E9 U+00E8 U+00E0 U+00E7 U+00EA U+00C8 */
 								    char *utf8_expected =
 								        "\xC3\xA9\xC3\xA8\xC3\xA0\xC3\xA7\xC3\xAA\xC3\x88";
 								    run_character_check(document, utf8_expected);
 								}
 								END_TEST
 								START_TEST(test_french_charref_decimal)
 								{
 								    /* decimal character references inside a Latin-1 document */
 								    char *document =
 								        "<?xml version='1.0' encoding='iso-8859-1'?>\n"
 								        "<doc>&#233;&#232;&#224;&#231;&#234;&#200;</doc>";
 								    /* UTF-8 for U+00E9 U+00E8 U+00E0 U+00E7 U+00EA U+00C8 */
 								    char *utf8_expected =
 								        "\xC3\xA9\xC3\xA8\xC3\xA0\xC3\xA7\xC3\xAA\xC3\x88";
 								    run_character_check(document, utf8_expected);
 								}
 								END_TEST
 								START_TEST(test_french_latin1)
 								{
 								    /* raw Latin-1 bytes in the element content */
 								    char *document =
 								        "<?xml version='1.0' encoding='iso-8859-1'?>\n"
 								        "<doc>\xE9\xE8\xE0\xE7\xEa\xC8</doc>";
 								    /* the same six characters encoded as UTF-8 */
 								    char *utf8_expected =
 								        "\xC3\xA9\xC3\xA8\xC3\xA0\xC3\xA7\xC3\xAA\xC3\x88";
 								    run_character_check(document, utf8_expected);
 								}
 								END_TEST
 								START_TEST(test_french_utf8)
 								{
 								    /* a two-byte UTF-8 sequence must be passed through unchanged */
 								    char *utf8_expected = "\xC3\xA9";
 								    char *document =
 								        "<?xml version='1.0' encoding='utf-8'?>\n"
 								        "<doc>\xC3\xA9</doc>";
 								    run_character_check(document, utf8_expected);
 								}
 								END_TEST
 								/* End regression test for SF bug #514281. */
-												Added a test to make sure that whitespace in ENTITIES, IDREFS, and NMTOKENS
attributes is properly collapsed according to Section 3.3.3 of the spec.
This is the first even slightly complicated test; boy are these painful in
C!  Had to add a test of a helper routine as well; that just uses assertions
since the test framework should not be dealing with tests of the tester,
just of Expat.

Added a helper to make the failure messages more useful when Expat produces
an unexpected error code; we now include the error message and location from
Expat.  This is mostly useful when developing a new test.

											
										
										
											2001-11-16 15:19:39 -05:00
+								/* Helpers used by the following test, which checks any "attr", "ents",
 								 * and "refs" attributes to make sure whitespace has been normalized.
 								 */
 								/* Report whether the string 's' looks like a normalized attribute
 								 * value.  Tab, newline and carriage return are never acceptable.
 								 * When 'is_cdata' is zero the value must also have no leading or
 								 * trailing space and no run of more than one space between other
 								 * characters; CDATA values are exempt from those space rules.
 								 * (Section 3.3.3 of the recommendation.)  Returns 1 when the value
 								 * is normalized and 0 otherwise.
 								 */
 								static int
 								is_whitespace_normalized(const XML_Char *s, int is_cdata)
 								{
 								    /* spaces seen since the last non-space character */
 								    int pending = 0;
 								    /* becomes non-zero once a non-space character has been seen */
 								    int seen_text = 0;
 								    const XML_Char *p;
 								    for (p = s; *p != 0; ++p) {
 								        switch (*p) {
 								        case ' ':
 								            ++pending;
 								            break;
 								        case '\t':
 								        case '\n':
 								        case '\r':
 								            return 0;
 								        default:
 								            if (!is_cdata) {
 								                /* no spaces may lead the value; one may separate
 								                 * two tokens
 								                 */
 								                int allowed = seen_text ? 1 : 0;
 								                if (pending > allowed)
 								                    return 0;
 								            }
 								            seen_text = 1;
 								            pending = 0;
 								            break;
 								        }
 								    }
 								    /* whatever is still pending here is trailing space */
 								    return (is_cdata || pending == 0) ? 1 : 0;
 								}
 								/* Self-test for is_whitespace_normalized().  Uses plain assert()
 								 * instead of the test framework, so a broken helper aborts the
 								 * program when main() calls this before running the suite.  Each input
 								 * is tried with is_cdata == 0 and with is_cdata == 1.
 								 */
 								static void
 								testhelper_is_whitespace_normalized(void)
 								{
 								    /* no spaces, or single spaces between tokens: always accepted */
 								    assert(is_whitespace_normalized("abc", 0));
 								    assert(is_whitespace_normalized("abc", 1));
 								    assert(is_whitespace_normalized("abc def ghi", 0));
 								    assert(is_whitespace_normalized("abc def ghi", 1));
 								    /* leading space: accepted only for CDATA */
 								    assert(!is_whitespace_normalized(" abc def ghi", 0));
 								    assert(is_whitespace_normalized(" abc def ghi", 1));
 								    /* doubled space between tokens: accepted only for CDATA */
 								    assert(!is_whitespace_normalized("abc  def ghi", 0));
 								    assert(is_whitespace_normalized("abc  def ghi", 1));
 								    /* trailing space: accepted only for CDATA */
 								    assert(!is_whitespace_normalized("abc def ghi ", 0));
 								    assert(is_whitespace_normalized("abc def ghi ", 1));
 								    /* a lone space: accepted only for CDATA */
 								    assert(!is_whitespace_normalized(" ", 0));
 								    assert(is_whitespace_normalized(" ", 1));
 								    /* tab, newline and carriage return are rejected in both modes */
 								    assert(!is_whitespace_normalized("\t", 0));
 								    assert(!is_whitespace_normalized("\t", 1));
 								    assert(!is_whitespace_normalized("\n", 0));
 								    assert(!is_whitespace_normalized("\n", 1));
 								    assert(!is_whitespace_normalized("\r", 0));
 								    assert(!is_whitespace_normalized("\r", 1));
 								    /* a tab embedded in otherwise acceptable CDATA is still rejected */
 								    assert(!is_whitespace_normalized("abc\t def", 1));
 								}
 								/* Start-element handler: fail the current test if any attribute named
 								 * "attr", "ents" or "refs" carries a value that is not whitespace
 								 * normalized according to the non-CDATA rules.  'atts' is a
 								 * NULL-terminated array of alternating attribute names and values;
 								 * 'userdata' and 'name' are not used.
 								 */
 								static void
 								check_attr_contains_normalized_whitespace(void *userdata,
 								                                          const XML_Char *name,
 								                                          const XML_Char **atts)
 								{
 								    int i;
 								    (void)userdata;
 								    (void)name;
 								    for (i = 0; atts[i] != NULL; i += 2) {
 								        const XML_Char *attrname = atts[i];
 								        const XML_Char *value = atts[i + 1];
 								        if (strcmp("attr", attrname) == 0
 								            || strcmp("ents", attrname) == 0
 								            || strcmp("refs", attrname) == 0) {
 								            if (!is_whitespace_normalized(value, 0)) {
 								                char buffer[256];
 								                /* The attribute name is one of the three 4-character
 								                 * names matched above, but the value comes from the
 								                 * document and can be any length.  The precision caps
 								                 * it so the message always fits: 32 bytes of fixed
 								                 * text + 4 + 2 + 200 + 1 + NUL = 240 <= 256.
 								                 */
 								                sprintf(buffer,
 								                        "attribute value not normalized: %s='%.200s'",
 								                        attrname, value);
 								                fail(buffer);
 								            }
 								        }
 								    }
 								}
 								START_TEST(test_attr_whitespace_normalization)
 								{
 								    /* The three attributes are declared with tokenized types and are
 								     * written with leading, trailing and repeated spaces, tabs and a
 								     * CR/LF pair; the start-element handler installed below checks
 								     * the values that the parser reports for them.
 								     */
 								    char *document =
 								        "<!DOCTYPE doc [\n"
 								        "  <!ATTLIST doc\n"
 								        "            attr NMTOKENS #REQUIRED\n"
 								        "            ents ENTITIES #REQUIRED\n"
 								        "            refs IDREFS   #REQUIRED>\n"
 								        "]>\n"
 								        "<doc attr='    a  b c\t\td\te\t' refs=' id-1   \t  id-2\t\t'  \n"
 								        "     ents=' ent-1   \t\r\n"
 								        "            ent-2  ' >\n"
 								        "  <e id='id-1'/>\n"
 								        "  <e id='id-2'/>\n"
 								        "</doc>";
 								    XML_SetStartElementHandler(
 								        parser, check_attr_contains_normalized_whitespace);
 								    /* a zero result from XML_Parse() means the parse failed */
 								    if (XML_Parse(parser, document, strlen(document), 1) == 0)
 								        xml_failure();
 								}
 								END_TEST
-A very small test suite for Expat; additional tests will be added as time
permits.

											
										
										
											2001-08-17 15:16:41 -04:00
+								static Suite *
 								make_basic_suite(void)
 								{
 								    Suite *s = suite_create("basic");
-												Added tests that some basic encodings are recognized and the corresponding
BOM marks do not cause core dumps.  The UTF-8 BOM bug was fixed a while ago,
but a regression test is always a good idea.

											
										
										
											2001-11-13 12:31:53 -05:00
+								    TCase *tc_chars = tcase_create("character tests");
-												Added a test to make sure that whitespace in ENTITIES, IDREFS, and NMTOKENS
attributes is properly collapsed according to Section 3.3.3 of the spec.
This is the first even slightly complicated test; boy are these painful in
C!  Had to add a test of a helper routine as well; that just uses assertions
since the test framework should not be dealing with tests of the tester,
just of Expat.

Added a helper to make the failure messages more useful when Expat produces
an unexpected error code; we now include the error message and location from
Expat.  This is mostly useful when developing a new test.

											
										
										
											2001-11-16 15:19:39 -05:00
+								    TCase *tc_attrs = tcase_create("attributes");
-												Added a test that ensures the parser reports an out-of-place XML declaration.
(Originally written to attempt to tickle a different bug, but useful as a
regression test even though Expat has been doing the right thing.)

											
										
										
											2001-11-12 23:49:52 -05:00
+								    TCase *tc_xmldecl = tcase_create("XML declaration");
-A very small test suite for Expat; additional tests will be added as time
permits.

											
										
										
											2001-08-17 15:16:41 -04:00
-												Added tests that some basic encodings are recognized and the corresponding
BOM marks do not cause core dumps.  The UTF-8 BOM bug was fixed a while ago,
but a regression test is always a good idea.

											
										
										
											2001-11-13 12:31:53 -05:00
+								    suite_add_tcase(s, tc_chars);
 								    tcase_add_checked_fixture(tc_chars, basic_setup, basic_teardown);
 								    tcase_add_test(tc_chars, test_nul_byte);
 								    tcase_add_test(tc_chars, test_u0000_char);
 								    tcase_add_test(tc_chars, test_bom_utf8);
 								    tcase_add_test(tc_chars, test_bom_utf16_be);
 								    tcase_add_test(tc_chars, test_bom_utf16_le);
-												basic_setup():  Remove bogus assumption that all tests would use US-ASCII
    data; let Expat determine the proper encoding from the XML source text.

Added several tests relating to supposed mis-interpretation of Latin-1;
these show that Expat (at least in the CVS version) is properly decoding
the Latin-1 text and generating the proper UTF-8 output.

This closes SF bug #491986, #514281.

											
										
										
											2002-04-19 14:25:07 -04:00
+								    /* Regression test for SF bug #491986. */
 								    tcase_add_test(tc_chars, test_danish_latin1);
 								    /* Regression test for SF bug #514281. */
-												Add the new tests to the right TCase object.

											
										
										
											2002-04-19 14:50:26 -04:00
+								    tcase_add_test(tc_chars, test_french_charref_hexidecimal);
 								    tcase_add_test(tc_chars, test_french_charref_decimal);
 								    tcase_add_test(tc_chars, test_french_latin1);
 								    tcase_add_test(tc_chars, test_french_utf8);
-A very small test suite for Expat; additional tests will be added as time
permits.

											
										
										
											2001-08-17 15:16:41 -04:00
-												Added a test to make sure that whitespace in ENTITIES, IDREFS, and NMTOKENS
attributes is properly collapsed according to Section 3.3.3 of the spec.
This is the first even slightly complicated test; boy are these painful in
C!  Had to add a test of a helper routine as well; that just uses assertions
since the test framework should not be dealing with tests of the tester,
just of Expat.

Added a helper to make the failure messages more useful when Expat produces
an unexpected error code; we now include the error message and location from
Expat.  This is mostly useful when developing a new test.

											
										
										
											2001-11-16 15:19:39 -05:00
+								    suite_add_tcase(s, tc_attrs);
 								    tcase_add_checked_fixture(tc_attrs, basic_setup, basic_teardown);
 								    tcase_add_test(tc_attrs, test_attr_whitespace_normalization);
-												Added a test that ensures the parser reports an out-of-place XML declaration.
(Originally written to attempt to tickle a different bug, but useful as a
regression test even though Expat has been doing the right thing.)

											
										
										
											2001-11-12 23:49:52 -05:00
+								    suite_add_tcase(s, tc_xmldecl);
-												Update to work with check 0.8.

											
										
										
											2001-11-13 00:04:02 -05:00
+								    tcase_add_checked_fixture(tc_xmldecl, basic_setup, basic_teardown);
-												Added a test that ensures the parser reports an out-of-place XML declaration.
(Originally written to attempt to tickle a different bug, but useful as a
regression test even though Expat has been doing the right thing.)

											
										
										
											2001-11-12 23:49:52 -05:00
+								    tcase_add_test(tc_xmldecl, test_xmldecl_misplaced);
-A very small test suite for Expat; additional tests will be added as time
permits.

											
										
										
											2001-08-17 15:16:41 -04:00
+								    return s;
 								}
 								int
 								main(int argc, char *argv[])
 								{
-												Added tests that some basic encodings are recognized and the corresponding
BOM marks do not cause core dumps.  The UTF-8 BOM bug was fixed a while ago,
but a regression test is always a good idea.

											
										
										
											2001-11-13 12:31:53 -05:00
+								    int i, nf;
 								    int forking = 0, forking_set = 0;
-												Update to work with check 0.8.

											
										
										
											2001-11-13 00:04:02 -05:00
+								    int verbosity = CK_NORMAL;
-A very small test suite for Expat; additional tests will be added as time
permits.

											
										
										
											2001-08-17 15:16:41 -04:00
+								    Suite *s = make_basic_suite();
 								    SRunner *sr = srunner_create(s);
-												Added a test to make sure that whitespace in ENTITIES, IDREFS, and NMTOKENS
attributes is properly collapsed according to Section 3.3.3 of the spec.
This is the first even slightly complicated test; boy are these painful in
C!  Had to add a test of a helper routine as well; that just uses assertions
since the test framework should not be dealing with tests of the tester,
just of Expat.

Added a helper to make the failure messages more useful when Expat produces
an unexpected error code; we now include the error message and location from
Expat.  This is mostly useful when developing a new test.

											
										
										
											2001-11-16 15:19:39 -05:00
+								    /* run the tests for internal helper functions */
 								    testhelper_is_whitespace_normalized();
-												Added tests that some basic encodings are recognized and the corresponding
BOM marks do not cause core dumps.  The UTF-8 BOM bug was fixed a while ago,
but a regression test is always a good idea.

											
										
										
											2001-11-13 12:31:53 -05:00
+								    for (i = 1; i < argc; ++i) {
 								        char *opt = argv[i];
-A very small test suite for Expat; additional tests will be added as time
permits.

											
										
										
											2001-08-17 15:16:41 -04:00
+								        if (strcmp(opt, "-v") == 0 || strcmp(opt, "--verbose") == 0)
-												Update to work with check 0.8.

											
										
										
											2001-11-13 00:04:02 -05:00
+								            verbosity = CK_VERBOSE;
-A very small test suite for Expat; additional tests will be added as time
permits.

											
										
										
											2001-08-17 15:16:41 -04:00
+								        else if (strcmp(opt, "-q") == 0 || strcmp(opt, "--quiet") == 0)
-												Update to work with check 0.8.

											
										
										
											2001-11-13 00:04:02 -05:00
+								            verbosity = CK_SILENT;
-												Added tests that some basic encodings are recognized and the corresponding
BOM marks do not cause core dumps.  The UTF-8 BOM bug was fixed a while ago,
but a regression test is always a good idea.

											
										
										
											2001-11-13 12:31:53 -05:00
+								        else if (strcmp(opt, "-f") == 0 || strcmp(opt, "--fork") == 0) {
 								            forking = 1;
 								            forking_set = 1;
 								        }
 								        else if (strcmp(opt, "-n") == 0 || strcmp(opt, "--no-fork") == 0) {
 								            forking = 0;
 								            forking_set = 1;
 								        }
-												Add a check for unknown command line options.

											
										
										
											2001-11-18 08:56:01 -05:00
+								        else {
 								            fprintf(stderr, "runtests: unknown option '%s'\n", opt);
 								            return 2;
 								        }
-A very small test suite for Expat; additional tests will be added as time
permits.

											
										
										
											2001-08-17 15:16:41 -04:00
+								    }
-												Added tests that some basic encodings are recognized and the corresponding
BOM marks do not cause core dumps.  The UTF-8 BOM bug was fixed a while ago,
but a regression test is always a good idea.

											
										
										
											2001-11-13 12:31:53 -05:00
+								    if (forking_set)
 								        srunner_set_fork_status(sr, forking ? CK_FORK : CK_NOFORK);
-A very small test suite for Expat; additional tests will be added as time
permits.

											
										
										
											2001-08-17 15:16:41 -04:00
+								    srunner_run_all(sr, verbosity);
 								    nf = srunner_ntests_failed(sr);
 								    srunner_free(sr);
 								    suite_free(s);
 								    return (nf == 0) ? EXIT_SUCCESS : EXIT_FAILURE;
 								}