001: /*
002: * gnu/regexp/util/RETest.java
003: * Copyright (C) 1998-2001 Wes Biggs
004: *
005: * This file is in the public domain. However, the gnu.regexp library
006: * proper is licensed under the terms of the GNU Lesser General Public
007: * License (see the file COPYING.LIB for details).
008: */
009: package gnu.regexp.util;
010:
011: import gnu.regexp.*;
012:
013: /**
014: * RETest provides a simple way to test regular expressions.
015: * It runs from the command line using the Java interpreter.
016: * To use it, enter the following from a command prompt (provided
017: * that the Java system knows where to find the RETest bytecodes):
018: * <BR><CODE>java gnu.regexp.util.RETest [regExp] [inputString]</CODE><BR>
019: * where <i>regExp</i> is a regular expression (you'll probably have
020: * to escape shell meta-characters) and <i>inputString</i> is the string
021: * to match against (again, put it in quotes or escape any shell meta-
022: * characters).
023: * <P>
024: * The test function will report the package version number, whether
025: * the expression matches the input string, what the match it found was,
026: * and the contents of any subexpressions, if applicable.
027: * <P>
028: * You may optionally add a third integer argument which is the number of
029: * times to repeat the test. When this option is used, RETest will report
030: * average compile and match times.
031: *
032: * @author <A HREF="mailto:wes@cacas.org">Wes Biggs</A>
033: * @version 1.01
034: */
035: public class RETest {
036: private RETest() {
037: }
038:
039: /**
040: * Invokes the test function with the command line arguments specified.
041: * See class description for usage notes.
042: *
043: * @param argv
044: * The command line arguments.
045: *
046: * @exception REException
047: * There was an error compiling or executing the regular expression.
048: */
049: public static void main(String argv[]) throws REException {
050: System.out.println("gnu.regexp version " + RE.version());
051:
052: int numRepeats = 1;
053: if (argv.length == 3)
054: numRepeats = Integer.parseInt(argv[2]);
055: if (argv.length < 2) {
056: System.out
057: .println("usage: java gnu.regexp.util.RETest regExp inputString [numRepeats]");
058: System.exit(1);
059: }
060:
061: // Construct the regular expression
062:
063: RE expression = null;
064: long begin = System.currentTimeMillis();
065:
066: for (int rpt = 0; rpt < numRepeats; rpt++)
067: expression = new RE(argv[0]);
068:
069: long end = System.currentTimeMillis();
070:
071: if (numRepeats > 1) {
072: System.out.println("Compiling " + numRepeats
073: + " times took " + (end - begin) + " ms");
074: System.out.println("Average compile time: "
075: + ((end - begin) / numRepeats) + " ms");
076: }
077:
078: // Display regular expression
079: System.out.println(" Input Text: " + argv[1]);
080: System.out.println("Regular Expression: " + argv[0]);
081: System.out.println(" Compiled Form: " + expression);
082: System.out.println(" Minimum Length: "
083: + expression.getMinimumLength());
084:
085: // Is the input in its entirety a match?
086: System.out.println(" isMatch() returns: "
087: + expression.isMatch(argv[1]));
088:
089: REMatch[] matches = expression.getAllMatches(argv[1]);
090: System.out.println(" getAllMatches(): " + matches.length
091: + " matches");
092: for (int i = 0; i < matches.length; i++) {
093: System.out.println("Match " + i + " ("
094: + matches[i].getStartIndex() + ","
095: + matches[i].getEndIndex() + "): " + matches[i]);
096: }
097:
098: // Get the first match
099: REMatch match = null;
100:
101: begin = System.currentTimeMillis();
102:
103: for (int rpt = 0; rpt < numRepeats; rpt++)
104: match = expression.getMatch(argv[1]);
105:
106: end = System.currentTimeMillis();
107:
108: if (numRepeats > 1) {
109: System.out.println("Finding first match " + numRepeats
110: + " times took " + (end - begin) + " ms");
111: System.out.println("Average match time: "
112: + ((end - begin) / numRepeats) + " ms");
113: }
114:
115: if (match == null)
116: System.out.println("Expression did not find a match.");
117: else {
118: // Report the full match indices
119:
120: System.out.println("Match found from position "
121: + match.getStartIndex() + " to position "
122: + match.getEndIndex());
123:
124: // Take advantage of REMatch.toString() to print match text
125:
126: System.out.println("Match was: '" + match + "'");
127:
128: // Report subexpression positions
129:
130: for (int i = 1; i <= expression.getNumSubs(); i++) {
131: if (match.getStartIndex(i) > -1) {
132: System.out.println("Subexpression #" + i
133: + ": from position "
134: + match.getStartIndex(i) + " to position "
135: + match.getEndIndex(i));
136:
137: // Note how the $n is constructed for substituteInto
138:
139: System.out
140: .println(match
141: .substituteInto("The subexpression matched this text: '$"
142: + i + "'"));
143: }
144: }
145: }
146:
147: // Here's a substitute test.
148: System.out.println("substitute(): "
149: + expression.substitute(argv[1], "<!--$0-->"));
150: System.out.println("substituteAll(): "
151: + expression.substituteAll(argv[1], "<!--$0-->"));
152: }
153: }
|