123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402 |
- /*
- * testRegexp.c: simple module for testing regular expressions
- *
- * See Copyright for the status of this software.
- *
- * Daniel Veillard <veillard@redhat.com>
- */
- #include "libxml.h"
- #ifdef LIBXML_REGEXP_ENABLED
- #include <string.h>
- #include <libxml/tree.h>
- #include <libxml/xmlregexp.h>
- static int repeat = 0;
- static int debug = 0;
- static void testRegexp(xmlRegexpPtr comp, const char *value) {
- int ret;
- ret = xmlRegexpExec(comp, (const xmlChar *) value);
- if (ret == 1)
- printf("%s: Ok\n", value);
- else if (ret == 0)
- printf("%s: Fail\n", value);
- else
- printf("%s: Error: %d\n", value, ret);
- if (repeat) {
- int j;
- for (j = 0;j < 999999;j++)
- xmlRegexpExec(comp, (const xmlChar *) value);
- }
- }
- static void
- testRegexpFile(const char *filename) {
- xmlRegexpPtr comp = NULL;
- FILE *input;
- char expression[5000];
- int len;
- input = fopen(filename, "r");
- if (input == NULL) {
- xmlGenericError(xmlGenericErrorContext,
- "Cannot open %s for reading\n", filename);
- return;
- }
- while (fgets(expression, 4500, input) != NULL) {
- len = strlen(expression);
- len--;
- while ((len >= 0) &&
- ((expression[len] == '\n') || (expression[len] == '\t') ||
- (expression[len] == '\r') || (expression[len] == ' '))) len--;
- expression[len + 1] = 0;
- if (len >= 0) {
- if (expression[0] == '#')
- continue;
- if ((expression[0] == '=') && (expression[1] == '>')) {
- char *pattern = &expression[2];
- if (comp != NULL) {
- xmlRegFreeRegexp(comp);
- comp = NULL;
- }
- printf("Regexp: %s\n", pattern) ;
- comp = xmlRegexpCompile((const xmlChar *) pattern);
- if (comp == NULL) {
- printf(" failed to compile\n");
- break;
- }
- } else if (comp == NULL) {
- printf("Regexp: %s\n", expression) ;
- comp = xmlRegexpCompile((const xmlChar *) expression);
- if (comp == NULL) {
- printf(" failed to compile\n");
- break;
- }
- } else if (comp != NULL) {
- testRegexp(comp, expression);
- }
- }
- }
- fclose(input);
- if (comp != NULL)
- xmlRegFreeRegexp(comp);
- }
- #ifdef LIBXML_EXPR_ENABLED
- static void
- runFileTest(xmlExpCtxtPtr ctxt, const char *filename) {
- xmlExpNodePtr expr = NULL, sub;
- FILE *input;
- char expression[5000];
- int len;
- input = fopen(filename, "r");
- if (input == NULL) {
- xmlGenericError(xmlGenericErrorContext,
- "Cannot open %s for reading\n", filename);
- return;
- }
- while (fgets(expression, 4500, input) != NULL) {
- len = strlen(expression);
- len--;
- while ((len >= 0) &&
- ((expression[len] == '\n') || (expression[len] == '\t') ||
- (expression[len] == '\r') || (expression[len] == ' '))) len--;
- expression[len + 1] = 0;
- if (len >= 0) {
- if (expression[0] == '#')
- continue;
- if ((expression[0] == '=') && (expression[1] == '>')) {
- char *str = &expression[2];
- if (expr != NULL) {
- xmlExpFree(ctxt, expr);
- if (xmlExpCtxtNbNodes(ctxt) != 0)
- printf(" Parse/free of Expression leaked %d\n",
- xmlExpCtxtNbNodes(ctxt));
- expr = NULL;
- }
- printf("Expression: %s\n", str) ;
- expr = xmlExpParse(ctxt, str);
- if (expr == NULL) {
- printf(" parsing Failed\n");
- break;
- }
- } else if (expr != NULL) {
- int expect = -1;
- int nodes1, nodes2;
- if (expression[0] == '0')
- expect = 0;
- if (expression[0] == '1')
- expect = 1;
- printf("Subexp: %s", expression + 2) ;
- nodes1 = xmlExpCtxtNbNodes(ctxt);
- sub = xmlExpParse(ctxt, expression + 2);
- if (sub == NULL) {
- printf(" parsing Failed\n");
- break;
- } else {
- int ret;
-
- nodes2 = xmlExpCtxtNbNodes(ctxt);
- ret = xmlExpSubsume(ctxt, expr, sub);
- if ((expect == 1) && (ret == 1)) {
- printf(" => accept, Ok\n");
- } else if ((expect == 0) && (ret == 0)) {
- printf(" => reject, Ok\n");
- } else if ((expect == 1) && (ret == 0)) {
- printf(" => reject, Failed\n");
- } else if ((expect == 0) && (ret == 1)) {
- printf(" => accept, Failed\n");
- } else {
- printf(" => fail internally\n");
- }
- if (xmlExpCtxtNbNodes(ctxt) > nodes2) {
- printf(" Subsume leaked %d\n",
- xmlExpCtxtNbNodes(ctxt) - nodes2);
- nodes1 += xmlExpCtxtNbNodes(ctxt) - nodes2;
- }
- xmlExpFree(ctxt, sub);
- if (xmlExpCtxtNbNodes(ctxt) > nodes1) {
- printf(" Parse/free leaked %d\n",
- xmlExpCtxtNbNodes(ctxt) - nodes1);
- }
- }
- }
- }
- }
- if (expr != NULL) {
- xmlExpFree(ctxt, expr);
- if (xmlExpCtxtNbNodes(ctxt) != 0)
- printf(" Parse/free of Expression leaked %d\n",
- xmlExpCtxtNbNodes(ctxt));
- }
- fclose(input);
- }
- static void
- testReduce(xmlExpCtxtPtr ctxt, xmlExpNodePtr expr, const char *tst) {
- xmlBufferPtr xmlExpBuf;
- xmlExpNodePtr sub, deriv;
- xmlExpBuf = xmlBufferCreate();
- sub = xmlExpParse(ctxt, tst);
- if (sub == NULL) {
- printf("Subset %s failed to parse\n", tst);
- return;
- }
- xmlExpDump(xmlExpBuf, sub);
- printf("Subset parsed as: %s\n",
- (const char *) xmlBufferContent(xmlExpBuf));
- deriv = xmlExpExpDerive(ctxt, expr, sub);
- if (deriv == NULL) {
- printf("Derivation led to an internal error, report this !\n");
- return;
- } else {
- xmlBufferEmpty(xmlExpBuf);
- xmlExpDump(xmlExpBuf, deriv);
- if (xmlExpIsNillable(deriv))
- printf("Resulting nillable derivation: %s\n",
- (const char *) xmlBufferContent(xmlExpBuf));
- else
- printf("Resulting derivation: %s\n",
- (const char *) xmlBufferContent(xmlExpBuf));
- xmlExpFree(ctxt, deriv);
- }
- xmlExpFree(ctxt, sub);
- }
- static void
- exprDebug(xmlExpCtxtPtr ctxt, xmlExpNodePtr expr) {
- xmlBufferPtr xmlExpBuf;
- xmlExpNodePtr deriv;
- const char *list[40];
- int ret;
- xmlExpBuf = xmlBufferCreate();
- if (expr == NULL) {
- printf("Failed to parse\n");
- return;
- }
- xmlExpDump(xmlExpBuf, expr);
- printf("Parsed as: %s\n", (const char *) xmlBufferContent(xmlExpBuf));
- printf("Max token input = %d\n", xmlExpMaxToken(expr));
- if (xmlExpIsNillable(expr) == 1)
- printf("Is nillable\n");
- ret = xmlExpGetLanguage(ctxt, expr, (const xmlChar **) &list[0], 40);
- if (ret < 0)
- printf("Failed to get list: %d\n", ret);
- else {
- int i;
- printf("Language has %d strings, testing string derivations\n", ret);
- for (i = 0;i < ret;i++) {
- deriv = xmlExpStringDerive(ctxt, expr, BAD_CAST list[i], -1);
- if (deriv == NULL) {
- printf(" %s -> derivation failed\n", list[i]);
- } else {
- xmlBufferEmpty(xmlExpBuf);
- xmlExpDump(xmlExpBuf, deriv);
- printf(" %s -> %s\n", list[i],
- (const char *) xmlBufferContent(xmlExpBuf));
- }
- xmlExpFree(ctxt, deriv);
- }
- }
- xmlBufferFree(xmlExpBuf);
- }
- #endif
- static void usage(const char *name) {
- fprintf(stderr, "Usage: %s [flags]\n", name);
- fprintf(stderr, "Testing tool for libxml2 string and pattern regexps\n");
- fprintf(stderr, " --debug: switch on debugging\n");
- fprintf(stderr, " --repeat: loop on the operation\n");
- #ifdef LIBXML_EXPR_ENABLED
- fprintf(stderr, " --expr: test xmlExp and not xmlRegexp\n");
- #endif
- fprintf(stderr, " --input filename: use the given filename for regexp\n");
- fprintf(stderr, " --input filename: use the given filename for exp\n");
- }
- int main(int argc, char **argv) {
- xmlRegexpPtr comp = NULL;
- #ifdef LIBXML_EXPR_ENABLED
- xmlExpNodePtr expr = NULL;
- int use_exp = 0;
- xmlExpCtxtPtr ctxt = NULL;
- #endif
- const char *pattern = NULL;
- char *filename = NULL;
- int i;
- xmlInitMemory();
- if (argc <= 1) {
- usage(argv[0]);
- return(1);
- }
- for (i = 1; i < argc ; i++) {
- if (!strcmp(argv[i], "-"))
- break;
- if (argv[i][0] != '-')
- continue;
- if (!strcmp(argv[i], "--"))
- break;
- if ((!strcmp(argv[i], "-debug")) || (!strcmp(argv[i], "--debug"))) {
- debug++;
- } else if ((!strcmp(argv[i], "-repeat")) ||
- (!strcmp(argv[i], "--repeat"))) {
- repeat++;
- #ifdef LIBXML_EXPR_ENABLED
- } else if ((!strcmp(argv[i], "-expr")) ||
- (!strcmp(argv[i], "--expr"))) {
- use_exp++;
- #endif
- } else if ((!strcmp(argv[i], "-i")) || (!strcmp(argv[i], "-f")) ||
- (!strcmp(argv[i], "--input")))
- filename = argv[++i];
- else {
- fprintf(stderr, "Unknown option %s\n", argv[i]);
- usage(argv[0]);
- }
- }
- #ifdef LIBXML_EXPR_ENABLED
- if (use_exp)
- ctxt = xmlExpNewCtxt(0, NULL);
- #endif
- if (filename != NULL) {
- #ifdef LIBXML_EXPR_ENABLED
- if (use_exp)
- runFileTest(ctxt, filename);
- else
- #endif
- testRegexpFile(filename);
- } else {
- int data = 0;
- #ifdef LIBXML_EXPR_ENABLED
- if (use_exp) {
- for (i = 1; i < argc ; i++) {
- if (strcmp(argv[i], "--") == 0)
- data = 1;
- else if ((argv[i][0] != '-') || (strcmp(argv[i], "-") == 0) ||
- (data == 1)) {
- if (pattern == NULL) {
- pattern = argv[i];
- printf("Testing expr %s:\n", pattern);
- expr = xmlExpParse(ctxt, pattern);
- if (expr == NULL) {
- printf(" failed to compile\n");
- break;
- }
- if (debug) {
- exprDebug(ctxt, expr);
- }
- } else {
- testReduce(ctxt, expr, argv[i]);
- }
- }
- }
- if (expr != NULL) {
- xmlExpFree(ctxt, expr);
- expr = NULL;
- }
- } else
- #endif
- {
- for (i = 1; i < argc ; i++) {
- if (strcmp(argv[i], "--") == 0)
- data = 1;
- else if ((argv[i][0] != '-') || (strcmp(argv[i], "-") == 0) ||
- (data == 1)) {
- if (pattern == NULL) {
- pattern = argv[i];
- printf("Testing %s:\n", pattern);
- comp = xmlRegexpCompile((const xmlChar *) pattern);
- if (comp == NULL) {
- printf(" failed to compile\n");
- break;
- }
- if (debug)
- xmlRegexpPrint(stdout, comp);
- } else {
- testRegexp(comp, argv[i]);
- }
- }
- }
- if (comp != NULL)
- xmlRegFreeRegexp(comp);
- }
- }
- #ifdef LIBXML_EXPR_ENABLED
- if (ctxt != NULL) {
- printf("Ops: %d nodes, %d cons\n",
- xmlExpCtxtNbNodes(ctxt), xmlExpCtxtNbCons(ctxt));
- xmlExpFreeCtxt(ctxt);
- }
- #endif
- xmlCleanupParser();
- xmlMemoryDump();
- return(0);
- }
- #else
- #include <stdio.h>
- int main(int argc ATTRIBUTE_UNUSED, char **argv ATTRIBUTE_UNUSED) {
- printf("%s : Regexp support not compiled in\n", argv[0]);
- return(0);
- }
- #endif /* LIBXML_REGEXP_ENABLED */
|