2 * testRegexp.c: simple module for testing regular expressions
4 * See Copyright for the status of this software.
6 * Daniel Veillard <veillard@redhat.com>
10 #ifdef LIBXML_REGEXP_ENABLED
13 #include <libxml/tree.h>
14 #include <libxml/xmlregexp.h>
16 static int repeat
= 0;
19 static void testRegexp(xmlRegexpPtr comp
, const char *value
) {
22 ret
= xmlRegexpExec(comp
, (const xmlChar
*) value
);
24 printf("%s: Ok\n", value
);
26 printf("%s: Fail\n", value
);
28 printf("%s: Error: %d\n", value
, ret
);
31 for (j
= 0;j
< 999999;j
++)
32 xmlRegexpExec(comp
, (const xmlChar
*) value
);
37 testRegexpFile(const char *filename
) {
38 xmlRegexpPtr comp
= NULL
;
40 char expression
[5000];
43 input
= fopen(filename
, "r");
45 xmlGenericError(xmlGenericErrorContext
,
46 "Cannot open %s for reading\n", filename
);
49 while (fgets(expression
, 4500, input
) != NULL
) {
50 len
= strlen(expression
);
53 ((expression
[len
] == '\n') || (expression
[len
] == '\t') ||
54 (expression
[len
] == '\r') || (expression
[len
] == ' '))) len
--;
55 expression
[len
+ 1] = 0;
57 if (expression
[0] == '#')
59 if ((expression
[0] == '=') && (expression
[1] == '>')) {
60 char *pattern
= &expression
[2];
63 xmlRegFreeRegexp(comp
);
66 printf("Regexp: %s\n", pattern
) ;
67 comp
= xmlRegexpCompile((const xmlChar
*) pattern
);
69 printf(" failed to compile\n");
72 } else if (comp
== NULL
) {
73 printf("Regexp: %s\n", expression
) ;
74 comp
= xmlRegexpCompile((const xmlChar
*) expression
);
76 printf(" failed to compile\n");
79 } else if (comp
!= NULL
) {
80 testRegexp(comp
, expression
);
86 xmlRegFreeRegexp(comp
);
89 #ifdef LIBXML_EXPR_ENABLED
91 runFileTest(xmlExpCtxtPtr ctxt
, const char *filename
) {
92 xmlExpNodePtr expr
= NULL
, sub
;
94 char expression
[5000];
97 input
= fopen(filename
, "r");
99 xmlGenericError(xmlGenericErrorContext
,
100 "Cannot open %s for reading\n", filename
);
103 while (fgets(expression
, 4500, input
) != NULL
) {
104 len
= strlen(expression
);
107 ((expression
[len
] == '\n') || (expression
[len
] == '\t') ||
108 (expression
[len
] == '\r') || (expression
[len
] == ' '))) len
--;
109 expression
[len
+ 1] = 0;
111 if (expression
[0] == '#')
113 if ((expression
[0] == '=') && (expression
[1] == '>')) {
114 char *str
= &expression
[2];
117 xmlExpFree(ctxt
, expr
);
118 if (xmlExpCtxtNbNodes(ctxt
) != 0)
119 printf(" Parse/free of Expression leaked %d\n",
120 xmlExpCtxtNbNodes(ctxt
));
123 printf("Expression: %s\n", str
) ;
124 expr
= xmlExpParse(ctxt
, str
);
126 printf(" parsing Failed\n");
129 } else if (expr
!= NULL
) {
133 if (expression
[0] == '0')
135 if (expression
[0] == '1')
137 printf("Subexp: %s", expression
+ 2) ;
138 nodes1
= xmlExpCtxtNbNodes(ctxt
);
139 sub
= xmlExpParse(ctxt
, expression
+ 2);
141 printf(" parsing Failed\n");
146 nodes2
= xmlExpCtxtNbNodes(ctxt
);
147 ret
= xmlExpSubsume(ctxt
, expr
, sub
);
149 if ((expect
== 1) && (ret
== 1)) {
150 printf(" => accept, Ok\n");
151 } else if ((expect
== 0) && (ret
== 0)) {
152 printf(" => reject, Ok\n");
153 } else if ((expect
== 1) && (ret
== 0)) {
154 printf(" => reject, Failed\n");
155 } else if ((expect
== 0) && (ret
== 1)) {
156 printf(" => accept, Failed\n");
158 printf(" => fail internally\n");
160 if (xmlExpCtxtNbNodes(ctxt
) > nodes2
) {
161 printf(" Subsume leaked %d\n",
162 xmlExpCtxtNbNodes(ctxt
) - nodes2
);
163 nodes1
+= xmlExpCtxtNbNodes(ctxt
) - nodes2
;
165 xmlExpFree(ctxt
, sub
);
166 if (xmlExpCtxtNbNodes(ctxt
) > nodes1
) {
167 printf(" Parse/free leaked %d\n",
168 xmlExpCtxtNbNodes(ctxt
) - nodes1
);
176 xmlExpFree(ctxt
, expr
);
177 if (xmlExpCtxtNbNodes(ctxt
) != 0)
178 printf(" Parse/free of Expression leaked %d\n",
179 xmlExpCtxtNbNodes(ctxt
));
185 testReduce(xmlExpCtxtPtr ctxt
, xmlExpNodePtr expr
, const char *tst
) {
186 xmlBufferPtr xmlExpBuf
;
187 xmlExpNodePtr sub
, deriv
;
188 xmlExpBuf
= xmlBufferCreate();
190 sub
= xmlExpParse(ctxt
, tst
);
192 printf("Subset %s failed to parse\n", tst
);
195 xmlExpDump(xmlExpBuf
, sub
);
196 printf("Subset parsed as: %s\n",
197 (const char *) xmlBufferContent(xmlExpBuf
));
198 deriv
= xmlExpExpDerive(ctxt
, expr
, sub
);
200 printf("Derivation led to an internal error, report this !\n");
203 xmlBufferEmpty(xmlExpBuf
);
204 xmlExpDump(xmlExpBuf
, deriv
);
205 if (xmlExpIsNillable(deriv
))
206 printf("Resulting nillable derivation: %s\n",
207 (const char *) xmlBufferContent(xmlExpBuf
));
209 printf("Resulting derivation: %s\n",
210 (const char *) xmlBufferContent(xmlExpBuf
));
211 xmlExpFree(ctxt
, deriv
);
213 xmlExpFree(ctxt
, sub
);
217 exprDebug(xmlExpCtxtPtr ctxt
, xmlExpNodePtr expr
) {
218 xmlBufferPtr xmlExpBuf
;
220 const char *list
[40];
223 xmlExpBuf
= xmlBufferCreate();
226 printf("Failed to parse\n");
229 xmlExpDump(xmlExpBuf
, expr
);
230 printf("Parsed as: %s\n", (const char *) xmlBufferContent(xmlExpBuf
));
231 printf("Max token input = %d\n", xmlExpMaxToken(expr
));
232 if (xmlExpIsNillable(expr
) == 1)
233 printf("Is nillable\n");
234 ret
= xmlExpGetLanguage(ctxt
, expr
, (const xmlChar
**) &list
[0], 40);
236 printf("Failed to get list: %d\n", ret
);
240 printf("Language has %d strings, testing string derivations\n", ret
);
241 for (i
= 0;i
< ret
;i
++) {
242 deriv
= xmlExpStringDerive(ctxt
, expr
, BAD_CAST list
[i
], -1);
244 printf(" %s -> derivation failed\n", list
[i
]);
246 xmlBufferEmpty(xmlExpBuf
);
247 xmlExpDump(xmlExpBuf
, deriv
);
248 printf(" %s -> %s\n", list
[i
],
249 (const char *) xmlBufferContent(xmlExpBuf
));
251 xmlExpFree(ctxt
, deriv
);
254 xmlBufferFree(xmlExpBuf
);
258 static void usage(const char *name
) {
259 fprintf(stderr
, "Usage: %s [flags]\n", name
);
260 fprintf(stderr
, "Testing tool for libxml2 string and pattern regexps\n");
261 fprintf(stderr
, " --debug: switch on debugging\n");
262 fprintf(stderr
, " --repeat: loop on the operation\n");
263 #ifdef LIBXML_EXPR_ENABLED
264 fprintf(stderr
, " --expr: test xmlExp and not xmlRegexp\n");
266 fprintf(stderr
, " --input filename: use the given filename for regexp\n");
267 fprintf(stderr
, " --input filename: use the given filename for exp\n");
270 int main(int argc
, char **argv
) {
271 xmlRegexpPtr comp
= NULL
;
272 #ifdef LIBXML_EXPR_ENABLED
273 xmlExpNodePtr expr
= NULL
;
275 xmlExpCtxtPtr ctxt
= NULL
;
277 const char *pattern
= NULL
;
278 char *filename
= NULL
;
287 for (i
= 1; i
< argc
; i
++) {
288 if (!strcmp(argv
[i
], "-"))
291 if (argv
[i
][0] != '-')
293 if (!strcmp(argv
[i
], "--"))
296 if ((!strcmp(argv
[i
], "-debug")) || (!strcmp(argv
[i
], "--debug"))) {
298 } else if ((!strcmp(argv
[i
], "-repeat")) ||
299 (!strcmp(argv
[i
], "--repeat"))) {
301 #ifdef LIBXML_EXPR_ENABLED
302 } else if ((!strcmp(argv
[i
], "-expr")) ||
303 (!strcmp(argv
[i
], "--expr"))) {
306 } else if ((!strcmp(argv
[i
], "-i")) || (!strcmp(argv
[i
], "-f")) ||
307 (!strcmp(argv
[i
], "--input")))
308 filename
= argv
[++i
];
310 fprintf(stderr
, "Unknown option %s\n", argv
[i
]);
315 #ifdef LIBXML_EXPR_ENABLED
317 ctxt
= xmlExpNewCtxt(0, NULL
);
320 if (filename
!= NULL
) {
321 #ifdef LIBXML_EXPR_ENABLED
323 runFileTest(ctxt
, filename
);
326 testRegexpFile(filename
);
329 #ifdef LIBXML_EXPR_ENABLED
332 for (i
= 1; i
< argc
; i
++) {
333 if (strcmp(argv
[i
], "--") == 0)
335 else if ((argv
[i
][0] != '-') || (strcmp(argv
[i
], "-") == 0) ||
337 if (pattern
== NULL
) {
339 printf("Testing expr %s:\n", pattern
);
340 expr
= xmlExpParse(ctxt
, pattern
);
342 printf(" failed to compile\n");
346 exprDebug(ctxt
, expr
);
349 testReduce(ctxt
, expr
, argv
[i
]);
354 xmlExpFree(ctxt
, expr
);
360 for (i
= 1; i
< argc
; i
++) {
361 if (strcmp(argv
[i
], "--") == 0)
363 else if ((argv
[i
][0] != '-') || (strcmp(argv
[i
], "-") == 0) ||
365 if (pattern
== NULL
) {
367 printf("Testing %s:\n", pattern
);
368 comp
= xmlRegexpCompile((const xmlChar
*) pattern
);
370 printf(" failed to compile\n");
374 xmlRegexpPrint(stdout
, comp
);
376 testRegexp(comp
, argv
[i
]);
381 xmlRegFreeRegexp(comp
);
384 #ifdef LIBXML_EXPR_ENABLED
386 printf("Ops: %d nodes, %d cons\n",
387 xmlExpCtxtNbNodes(ctxt
), xmlExpCtxtNbCons(ctxt
));
388 xmlExpFreeCtxt(ctxt
);
398 int main(int argc ATTRIBUTE_UNUSED
, char **argv ATTRIBUTE_UNUSED
) {
399 printf("%s : Regexp support not compiled in\n", argv
[0]);
402 #endif /* LIBXML_REGEXP_ENABLED */