Context Navigation

source: branches/OKBJavaConnector/ECJClient/src/ec/util/Lexer.java @ 6934

Visit:

Last change on this file since 6934 was 6152, checked in by bfarka, 14 years ago
added ecj and custom statistics to communicate with the okb services #1441
File size: 2.8 KB

Line
1	package ec.util;
2	import java.util.regex.*;
3
4	/*
5	* Lexer.java
6	*
7	* Created: Sun Dec 5 11:33:43 EST 2010
8	* By: Sean Luke
9	*
10	*/
11
12	/**
13	* A simple line-by-line String tokenizer. You provide Lexer with a String or other
14	* CharSequence as input, plus an array of regular expressions. Each time you call
15	* nextToken(...), the Lexer matches the next token against the regular expressions
16	* and returns it. The regular expressions are checked in order, and the first one
17	* that matches is the winner.
18	*
19	*/
20
21	public class Lexer
22	{
23	/** An index which indicates that no further tokens were found. This could be due to the end of the string or due to a bad
24	string. You'll need to check the index to determine for sure.*/
25	public static final int FAILURE = -1;
26
27	CharSequence input;
28	int position = 0;
29	Matcher[] matchers;
30	String[] regexps;
31	int matchingIndex = FAILURE;
32
33	/** Builds a Lexer for the given input with the provided regular expressions. The regular expressions
34	will be checked in order against the input, and the first one which matches will be assumed to be the token.*/
35
36	public Lexer(CharSequence input, String[] regexps)
37	{
38	this.regexps = regexps;
39	matchers = new Matcher[regexps.length];
40	for(int i = 0 ; i < regexps.length; i++)
41	matchers[i] = Pattern.compile(regexps[i]).matcher(input); // not DOTALL
42	this.input = input;
43	}
44
45	/** Returns the next token as a string. If trim is true, then the string is first trimmed of whitespace. */
46	public String nextToken(boolean trim)
47	{
48	for(int i = 0 ; i < regexps.length; i++)
49	{
50	if (!matchers[i].region(position, input.length()).lookingAt()) continue;
51	position = matchers[i].end();
52	matchingIndex = i;
53	return ( trim ? matchers[i].group().trim() : matchers[i].group() );
54	}
55	// we failed
56	matchingIndex = -1;
57	return null;
58	}
59
60	/** Returns the next token as a string. The string is first trimmed of whitespace. */
61	public String nextToken() { return nextToken(true); }
62
63
64	/** Returns the index of the regular expression which matched the most recent token. */
65	public int getMatchingIndex()
66	{
67	return matchingIndex;
68	}
69
70	/** Returns the regular expression which matched the most recent token. */
71	public String getMatchingRule()
72	{
73	if (matchingIndex == -1) return null;
74	return regexps[matchingIndex];
75	}
76
77	/** Returns the position in the String just beyond the most recent token. */
78	public int getMatchingPosition()
79	{
80	return position;
81	}
82
83	}

Note: See TracBrowser for help on using the repository browser.

Download in other formats:

Update cookies preferences