RegexParser.java example

Explorer

studio2-master
- plugins
- tests
  - com.aptana.ide.core.io.tests
    - src
      - com
        aptana
        ide
        core
        io
        efs
        tests
        EFSUtilsTest.java
        LocalFileTest.java
        WorkspaceFileSystemTest.java
        WorkspaceFileTest.java
        tests
        BaseConnectionTest.java
        CommonConnectionTest.java
        filesystem
        ftp
        FTPCachedConnectionFileManager.java
        FTPCachedConnectionPoint.java
        tests
        AllTests.java
        FTPCachedConnectionTest.java
        FTPCommonConnectionTest.java
        FTPConnectionTest.java
        FTPConnectionWithBasePathTest.java
        SFTPConnectionTest.java
  - com.aptana.ide.core.spellcheck.tests
    - src
      - com
        aptana
        commons
        spelling
        engine
        AllTests.java
        NoCompletionsProposalTest.java
        SpellingAnnotationTest.java
        SpellingCorrectionProcessorTest.java
        TextInvocationContextTest.java
  - com.aptana.ide.core.tests
    - src
      - com
        aptana
        ide
        core
        io
        sync
        tests
        AllTests.java
        tests
        AllTests.java
        FileUtilsTest.java
        IdeLogTest.java
        KeyValuePairTest.java
        PackageTestCase.java
        PluginUtilsTest.java
        StreamUtilsTest.java
        StringUtilsTest.java
        TestingPlugin.java
        URLEncoderTest.java
        util
        FormattingUtils.java
        xpath
        XPathUtilsTest.java
      - jtest
        ProjectTestCase.java
  - com.aptana.ide.core.ui.tests
    - src
      - com
        aptana
        ide
        core
        io
        file
        tests
        AllTests.java
        tests
        AllTests.java
        ui
        tests
        AllTests.java
        CoreUIUtilsTest.java
        SetUtilsTest.java
        TestsPlugin.java
  - com.aptana.ide.debug.tests
    - src
      - com
        aptana
        ide
        debug
        test
        AbstractVariableInstruction.java
        AutomatedTestController.java
        BreakpointInstruction.java
        DelayInstruction.java
        GroupInstruction.java
        IInstruction.java
        IReference.java
        PrintValueInstruction.java
        SourceLineReferrence.java
        Startup.java
        StepInstruction.java
        SuspendResumeInstruction.java
        TerminateInstruction.java
        TestPlugin.java
        TestSession.java
        VerifyValueInstruction.java
  - com.aptana.ide.editor.css.tests
    - src
      - com
        aptana
        ide
        editor
        css
        tests
        AllTests.java
        TestIdentifierTokens.java
        TestKeywordTokens.java
        TestLiteralTokens.java
        TestPairFinder.java
        TestParseTime.java
        TestPunctuatorTokens.java
        TestStatements.java
        TestWhitespaceTokens.java
        TestsPlugin.java
        contentassist
        AllTests.java
        CSSContentAssistProcessorTest.java
        CSSUtilsTest.java
        editors
        css
        tests
        formatting
        AllTests.java
        FormattingTests.java
  - com.aptana.ide.editor.html.tests
    - src
      - com
        aptana
        ide
        editor
        html
        tests
        AllTests.java
        HTMLJSTest.java
        TestBugs.java
        TestDelimiterGroups.java
        TestKeywordTokens.java
        TestLiteralTokens.java
        TestPairFinder.java
        TestPunctuatorTokens.java
        TestStatements.java
        TestWhitespaceTokens.java
        TestingPlugin.java
        contentassist
        AllTests.java
        HTMLContentAssistProcessorTest.java
        HTMLUtilsTest.java
        formatting
        AllTests.java
        FormattingTests.java
        HTMLAutoIndentStrategyTest.java
  - com.aptana.ide.editor.js.tests
    - src
      - com
        aptana
        ide
        editor
        js
        tests
        AllTests.java
        Documentation2Tests.java
        JSLanguageEnvironmentTest.java
        TestComments.java
        TestDelimiterGroups.java
        TestIdentifierTokens.java
        TestKeywordTokens.java
        TestLexTime.java
        TestLiteralTokens.java
        TestPairFinder.java
        TestParseTime.java
        TestPunctuatorTokens.java
        TestStatements.java
        TestWhitespaceTokens.java
        TestingPlugin.java
        contentassist
        AllTests.java
        JSCompletionProposalTest.java
        JSContentAssistProcessorTest.java
        environment
        AllTests.java
        DOMTest.java
        JSCoreTest.java
        UserCodeTest.java
        formatting
        AllTests.java
        TestFormatting.java
        model
        AllTests.java
        TestArrayConstructor.java
        TestArrayFromInvocation.java
        TestArrayInstance.java
        TestBooleanConstructor.java
        TestBooleanFromInvocation.java
        TestBooleanInstance.java
        TestDateConstructor.java
        TestDateFromInvocation.java
        TestDateInstance.java
        TestErrorConstructor.java
        TestErrorFromInvocation.java
        TestErrorInstance.java
        TestFunctionConstructor.java
        TestFunctionFromInvocation.java
        TestFunctionInstance.java
        TestMathInstance.java
        TestModelBase.java
        TestNumberConstructor.java
        TestNumberFromInvocation.java
        TestNumberInstance.java
        TestObjectConstructor.java
        TestObjectFromInvocation.java
        TestObjectInstance.java
        TestProperties.java
        TestRegExpConstructor.java
        TestRegExpFromInvocation.java
        TestRegExpInstance.java
        TestStringConstructor.java
        TestStringFromInvocation.java
        TestStringInstance.java
        TestVariables.java
        outline
        AllTests.java
        ReusabilityTests.java
        TestBlockItems.java
        TestInheritanceItems.java
        TestOutlineItemBase.java
        TestScopeStrings.java
        TestSimpleItems.java
        testJSPartitions.java
        jscomment
        tests
        AllTests.java
        TestBugs.java
        TestDelimiterTokens.java
        TestLiteralTokens.java
        TestWhitespaceTokens.java
        scriptdoc
        tests
        AllTests.java
        TestDelimiterTokens.java
        TestDocumentationXML.java
        TestIdentifierTokens.java
        TestKeywordTokens.java
        TestLiteralTokens.java
        TestPunctuatorTokens.java
        TestWhitespaceTokens.java
        TransformOAATests.java
        runtime
        AllTests.java
        TestCodeGeneration.java
        TestOpcodes.java
  - com.aptana.ide.editor.xml.tests
    - src
      - com
        aptana
        ide
        editor
        xml
        tests
        AllTests.java
        TestBugs.java
        TestDTDTokens.java
        TestKeywordTokens.java
        TestLexTime.java
        TestLiteralTokens.java
        TestPairFinder.java
        TestParseTime.java
        TestPunctuatorTokens.java
        TestStatements.java
        TestingPlugin.java
        formatting
        AllTests.java
        FormattingTests.java
  - com.aptana.ide.editors.tests
    - src
      - com
        aptana
        ide
        editor
        junit
        profiles
        AllTests.java
        ProfileManagerTest.java
        ProfileTest.java
        editors
        junit
        AllTests.java
        ContentAssistTestCase.java
        ContentAssistTestSuite.java
        EditorsJunitPlugin.java
        GenericProject.java
        LexerUtils.java
        ProfileFile.java
        ProjectTestUtils.java
        TestCopyPasteAction.java
        TestDocumentCommand.java
        TestProject.java
        TestSelectionFormattingAction.java
        TestTextViewer.java
        TestUtils.java
        formatting
        AllTests.java
        SelectionFormattingTests.java
        UnifiedBracketInserterTest.java
        js
        AllTests.java
        JSEdgeCaseTests.java
        JSEdgeCasesProject.java
        JSTodoTests.java
        pairmatching
        AllTests.java
        PairMatchingTest.java
        partitions
        AllTests.java
        Messages.java
        PartitionsTest.java
        unified
        AllTests.java
        UnifiedViewerTest.java
        contentassist
        AbstractContentAssistProcessorTest.java
        AllTests.java
        CompletionProposalPopupTest.java
        UnifiedContentAssistProcessorTest.java
        tests
        views
        profiles
        AllTests.java
        ProfilesViewHelperTest.java
        unified
        errors
        tests
        AllTests.java
        ErrorDescriptorTest.java
  - com.aptana.ide.intro.tests
    - src
      - com
        aptana
        ide
        intro
        tests
        Activator.java
        AllTests.java
        OpenTestPageAction.java
        preferences
        AllTests.java
        FeatureDescriptorTest.java
        FeatureRegistryTest.java
        ProFeatureDescriptorTest.java
  - com.aptana.ide.logging.tests
    - src
      - com
        aptana
        ide
        logging
        impl
        AllTests.java
        InLineMatcherTest.java
        WorkspaceLogProviderTest.java
        tests
        AllTests.java
        FileWriterTest.java
        LoggingTestsPlugin.java
        PerfomanceTest.java
        ReaderWriterTest.java
  - com.aptana.ide.parsing.tests
    - src
      - com
        aptana
        ide
        lexer
        experimental
        CharAccessMethods.java
        FindAndReplace.java
        MatcherSpeedTests.java
        RegexMatchGroups.java
        ShowCategories.java
        matchers
        AllMatcherTests.java
        AndMatcherTest.java
        CharacterClassMatcherTest.java
        CharacterMatcherTest.java
        CommentMatcherTest.java
        DigitMatcherTest.java
        EndOfFileMatcherTest.java
        EndOfLineMatcherTest.java
        HexMatcherTest.java
        IdentifierMatcherTest.java
        LetterMatcherTest.java
        LetterOrDigitMatcherTest.java
        LineTerminatorMatcherTest.java
        LookaheadMatcherTest.java
        LowercaseLetterMatcherTest.java
        MatcherMapTest.java
        NumberMatcherTest.java
        OneOrMoreMatcherTest.java
        OptionalMatcherTest.java
        OrMatcherTest.java
        QuotedStringMatcherTest.java
        RegexMatcherTest.java
        RepetitionMatcherTest.java
        StartOfLineMatcherTest.java
        StringMatcherTest.java
        ToDelimiterMatcherTest.java
        UppercaseLetterMatcherTest.java
        WhitespaceMatcherTest.java
        WordBoundaryMatcherTest.java
        WordMatcherTest.java
        ZeroOrMoreMatcherTest.java
        tests
        AllTests.java
        TestLexeme.java
        TestLexemeList.java
        TestTokenBase.java
        metadata
        AllTests.java
        ElementMetadataTest.java
        MetadataItemTest.java
        MetadataRuntimeEnvironmentTest.java
        parsing
        bnf
        tests
        AllTests.java
        BootstrapTest.java
        ExpandedSourceTest.java
        FactoredGrammar.java
        FirstSetTest.java
        FollowSetTest.java
        ItemTests.java
        SampleGrammar.java
        SourceTest.java
        SymbolsTest.java
        TableTest.java
        TokenTypes.java
        experimental
        ASTHandlerParser.java
        AllTests.java
        BNFRunner.java
        Parser.java
        TestLRParserBuilder.java
        tests
        CoreTests.java
        ParseNodeTests.java
        ParseStateTests.java
        UITests.java
        xpath
        XPathStringTests.java
        XPathTests.java
        regex
        tests
        AllTests.java
        RegexTest.java
        TestStatements.java
  - com.aptana.ide.sax.tests
    - src
      - com
        aptana
        ide
        sax
        tests
        AllTests.java
        TestLexerSchemaBuilder.java
        TestMetadataSchemaBuilder.java
  - com.aptana.ide.server.core.tests
    - src
      - com
        aptana
        ide
        server
        AllServerCoreTests.java
        resources
        FileHttpResourceTest.java
        WorkspaceHttpFolderResourceTest.java
        WorkspaceHttpResourceTest.java
  - com.aptana.ide.server.tests
    - src
      - com
        aptana
        ide
        server
        tests
        AllTests.java
        ConfigurationTests.java
        ServerTypeDelegate.java
        ServersTest.java
        TestModuleType.java
        TestServer.java
  - com.aptana.ide.syncing.tests
    - src
      - com
        aptana
        ide
        io
        ftp
        tests
        AllTests.java
        syncing
        tests
        AllTests.java
        FTPSyncingTests.java
        FTPSyncingTestsWithSpaces.java
        LocalSyncingTests.java
        LocalSyncingTestsWithSpaces.java
        SyncingTests.java
        TestsPlugin.java
  - com.aptana.ide.tests
    - src
      - com
        aptana
        ide
        experimental
        ResourceVsFile.java
        UTFvsString.java
        WritingStrings.java
        tests
        AllPluginTests.java
        CoreTests.java
        TestsPlugin.java
        UITests.java
- tools
  - com.aptana.ide.parsing.tools
    - com
      - aptana
        parsing
        metadata
        oaa
        ClosureType.java
        OAAElementDefinition.java
        OAAHandler.java
        OAAList.java
        OAAParser.java
        OAAReference.java
        OAATest.java
        tools
        AllMetadataToBinary.java
        AllScriptDocsToBinary.java
        GenerateAllBinaries.java
        Messages.java
        MetadataToBinary.java
        ScriptDocToBinary.java
  - com.aptana.parsing.adapter
    - src
      - org
        eclipse
        core
        runtime
        IStatus.java
        Log.java
        Platform.java
        Plugin.java
        Preferences.java
        Status.java
        osgi
        util
        NLS.java
        osgi
        framework
        Bundle.java
        BundleContext.java
        Constants.java

/**
 * This file Copyright (c) 2005-2008 Aptana, Inc. This program is
 * dual-licensed under both the Aptana Public License and the GNU General
 * Public license. You may elect to use one or the other of these licenses.
 * 
 * This program is distributed in the hope that it will be useful, but
 * AS-IS and WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE, TITLE, or
 * NONINFRINGEMENT. Redistribution, except as permitted by whichever of
 * the GPL or APL you select, is prohibited.
 *
 * 1. For the GPL license (GPL), you can redistribute and/or modify this
 * program under the terms of the GNU General Public License,
 * Version 3, as published by the Free Software Foundation.  You should
 * have received a copy of the GNU General Public License, Version 3 along
 * with this program; if not, write to the Free Software Foundation, Inc., 51
 * Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 * 
 * Aptana provides a special exception to allow redistribution of this file
 * with certain other free and open source software ("FOSS") code and certain additional terms
 * pursuant to Section 7 of the GPL. You may view the exception and these
 * terms on the web at http://www.aptana.com/legal/gpl/.
 * 
 * 2. For the Aptana Public License (APL), this program and the
 * accompanying materials are made available under the terms of the APL
 * v1.0 which accompanies this distribution, and is available at
 * http://www.aptana.com/legal/apl/.
 * 
 * You may view the GPL, Aptana's exception and additional terms, and the
 * APL in the file titled license.html at the root of the corresponding
 * plugin containing this source file.
 * 
 * Any modifications to this file must keep this entire header intact.
 */
package com.aptana.ide.regex;

import java.text.MessageFormat;
import java.text.ParseException;
import java.util.Stack;

import com.aptana.ide.regex.dfa.DFAGraph;
import com.aptana.ide.regex.inputs.AnyInput;
import com.aptana.ide.regex.inputs.CharacterClassInput;
import com.aptana.ide.regex.inputs.CharacterInput;
import com.aptana.ide.regex.inputs.DigitInput;
import com.aptana.ide.regex.inputs.Input;
import com.aptana.ide.regex.inputs.WhiteSpaceInput;
import com.aptana.ide.regex.inputs.WordInput;
import com.aptana.ide.regex.nfa.NFAGraph;

/**
 * Converts a regular expression expressed as a string into a state machine. This state machine can be used to recognize
 * text patterns as described by the original regular expression
 * <p>
 * <code>
 * This parser recognizes the following grammar:
 * <p>
 * Expression
 *     : OrExpression
 *     | '^' OrExpression
 *     | OrExpression '$'
 *     ;
 * OrExpression
 *     : OrExpression '|' AndExpression
 *     | AndExpression
 *     ;
 * AndExpression
 *     : AndExpression Factor
 *     | Factor
 *     ;
 * Factor
 *     : Term '*'
 *     | Term '+'
 *     | Term '?'
 *     | Term
 *     ;
 * Term
 *     : '[' string ']'
 *     | '[^' string ']'
 *     | '[]'
 *     | '[^]'
 *     | '.'
 *     | character
 *     | '(' OrExpression ')'
 *     ;
 * </code>
 * 
 * @author Kevin Lindsey
 */
public class RegexParser
{
	// characters of the regular expression currently being parsed (assigned in parse)
	private char[] _regex;
	// position of the current character within _regex
	private int _index;
	// NFA machines built so far; each parsed term is pushed and operators combine the top entries
	Stack<NFAGraph> _nfaStack;
	// accept state handed to every NFAGraph created while parsing the current regex
	int _acceptState;
	// value returned by getDFAGraph(); nothing in this class assigns it
	DFAGraph _dfa;

	/**
	 * Look at the character under the parse cursor without consuming it.
	 * 
	 * @return The character at the current index, or '\0' once the end of the regular expression has been reached
	 */
	private char getCurrentChar()
	{
		return this.getEOS() ? '\0' : this._regex[this._index];
	}

	/**
	 * Determine if the current character is an ASCII hexadecimal digit (0-9, A-F or a-f)
	 * 
	 * @return Returns true if the current character is a valid hexadecimal digit
	 */
	private boolean isHexDigit()
	{
		char c = this.getCurrentChar();
		boolean decimal = ('0' <= c && c <= '9');
		boolean upper = ('A' <= c && c <= 'F');
		boolean lower = ('a' <= c && c <= 'f');

		return decimal || upper || lower;
	}

	/**
	 * Return the DFA currently held by this parser.
	 * <p>
	 * NOTE(review): no code in this class assigns the underlying field; it is package-visible, so presumably it is
	 * populated elsewhere - confirm before relying on a non-null result.
	 * 
	 * @return The stored DFA graph, which is null unless something outside this class has set it
	 */
	public DFAGraph getDFAGraph()
	{
		return _dfa;
	}

	/**
	 * Test whether the parse cursor has moved past the last character of the regular expression
	 * 
	 * @return true when the current index is at or beyond the length of the regular expression
	 */
	private boolean getEOS()
	{
		return this._regex.length <= this._index;
	}

	/**
	 * Get the NFA graph on top of the NFA stack without removing it
	 * 
	 * @return The top-most NFA graph, or null when the stack is empty
	 */
	public NFAGraph getNFAGraph()
	{
		return this._nfaStack.isEmpty() ? null : this._nfaStack.peek();
	}

	/**
	 * Expose the stack of NFA machines built by this parser. The live stack is returned, not a copy.
	 * 
	 * @return The NFA stack
	 */
	public Stack<NFAGraph> getNFAStack()
	{
		return _nfaStack;
	}

	/**
	 * Decide whether the current character may begin a factor of an And expression. End of input, '\0', the
	 * operators '|', '*', '+', '?', the anchors '^', '$' and a closing ')' cannot.
	 * 
	 * @return Returns true if the current character can start an And expression
	 */
	private boolean isFirstInAndExpression()
	{
		if (this.getEOS())
		{
			return false;
		}

		switch (this.getCurrentChar())
		{
			case '\0':
			case '|':
			case ')':
			case '*':
			case '+':
			case '?':
			case '^':
			case '$':
				return false;

			default:
				return true;
		}
	}

	/*
	 * Constructors
	 */

	/**
	 * Create a parser that starts out with an empty NFA stack
	 */
	public RegexParser()
	{
		_nfaStack = new Stack<NFAGraph>();
	}

	/*
	 * Methods
	 */

	/**
	 * Move the cursor forward by at least one character and then past any whitespace that follows, stopping at the
	 * next non-whitespace character or at the end of the regular expression. Does nothing once the end has been
	 * reached.
	 */
	private void advance()
	{
		int end = this._regex.length;

		if (this._index >= end)
		{
			// already at the end; nothing left to consume
			return;
		}

		// the first pass consumes the current character, later passes consume whitespace
		do
		{
			this._index++;
		}
		while (this._index < end && Character.isWhitespace(this._regex[this._index]));
	}

	/**
	 * Parse a regular expression expressed as a string into NFA machines that recognize the text pattern described by
	 * the regular expression. Every machine created during the parse is tagged with the given accept state, and the
	 * result is left on this parser's NFA stack (see getNFAGraph). The stack is not cleared first; call reset() to
	 * discard machines from earlier parses.
	 * 
	 * @param regex
	 *            The regex to parse
	 * @param acceptState
	 *            The accept state to associate with this regex
	 * @throws NullPointerException
	 *             if regex is null
	 * @throws ParseException
	 *             if regex is empty or cannot be parsed; the error offset is the index at which parsing stopped
	 * @throws IllegalStateException
	 *             if the regex contains a malformed \x hexadecimal escape
	 */
	public void parse(String regex, int acceptState) throws ParseException
	{
		if (regex == null)
		{
			throw new NullPointerException(Messages.RegexParser_Undefined);
		}
		if (regex.length() == 0)
		{
			throw new ParseException(Messages.RegexParser_Empty, 0);
		}

		this._regex = regex.toCharArray();
		// start one position before the text so the priming advance() lands on the first non-whitespace character
		this._index = -1;
		this._acceptState = acceptState;

		// prime current character
		this.advance();

		// parse regex
		if (this.parseExpression() == false)
		{
			Object[] messageArgs = new Object[] { regex, Integer.toString(this._index) };
			String message = MessageFormat.format(Messages.RegexParser_Parse_Error, messageArgs);

			// report where parsing stopped instead of always claiming offset 0
			throw new ParseException(message, this._index);
		}
	}

	/**
	 * Parse a complete regular expression: an optional leading '^', an Or expression, and an optional '$' as the very
	 * last character. The anchors are consumed but not otherwise recorded.
	 * 
	 * @return A boolean that indicates whether the expression was successfully parsed or not.
	 */
	private boolean parseExpression()
	{
		if (this.getCurrentChar() == '^')
		{
			// step over the start-of-line anchor
			this.advance();
		}

		boolean parsed = true;

		while (parsed && this.getEOS() == false)
		{
			parsed = this.parseOrExpression();

			// '$' only counts as an end-of-line anchor when it is the final character
			boolean onLastChar = (this._index == this._regex.length - 1);

			if (onLastChar && this.getCurrentChar() == '$')
			{
				this.advance();
			}
		}

		return parsed;
	}

	/**
	 * Parse one or more And expressions separated by '|'. Each right-hand machine is popped from the NFA stack and
	 * merged into the machine beneath it as an alternative.
	 * 
	 * @return A boolean that indicates whether the expression was successfully parsed or not.
	 */
	private boolean parseOrExpression()
	{
		if (this.parseAndExpression() == false)
		{
			return false;
		}

		while (this.getCurrentChar() == '|')
		{
			// step over '|'
			this.advance();

			if (this.parseAndExpression() == false)
			{
				return false;
			}

			// fold the right-hand alternative into the left-hand machine
			NFAGraph right = this._nfaStack.pop();
			NFAGraph left = this._nfaStack.peek();

			left.orMachines(right);
		}

		return true;
	}

	/**
	 * Parse a regular expression AND expression: a sequence of one or more factors. Each factor after the first is
	 * popped from the NFA stack and concatenated onto the machine beneath it.
	 * 
	 * @return A boolean that indicates whether the expression was successfully parsed or not. False is returned when
	 *         the current character cannot start a factor or when any factor, including the first, fails to parse.
	 */
	private boolean parseAndExpression()
	{
		if (this.isFirstInAndExpression() == false)
		{
			return false;
		}

		// the left-hand side must parse too; ignoring its result let malformed input such as "(a" be accepted
		if (this.parseFactor() == false)
		{
			return false;
		}

		// get remaining right-hand sides
		while (this.isFirstInAndExpression())
		{
			if (this.parseFactor() == false)
			{
				return false;
			}

			// build AND machine
			NFAGraph rhs = this._nfaStack.pop();
			NFAGraph lhs = this._nfaStack.peek();

			lhs.andMachines(rhs);
		}

		return true;
	}

	/**
	 * Parse a term followed by an optional '*', '+' or '?' operator. The operator, when present, is consumed and
	 * applied to the machine that the term left on top of the NFA stack.
	 * 
	 * @return A boolean that indicates whether the expression was successfully parsed or not.
	 */
	private boolean parseFactor()
	{
		if (this.parseTerm() == false)
		{
			return false;
		}

		NFAGraph machine = this._nfaStack.peek();
		char operator = this.getCurrentChar();

		if (operator == '*')
		{
			// zero or more
			this.advance();
			machine.kleeneClosure();
		}
		else if (operator == '+')
		{
			// one or more
			this.advance();
			machine.positiveClosure();
		}
		else if (operator == '?')
		{
			// zero or one
			this.advance();
			machine.option();
		}

		return true;
	}

	/**
	 * Parse a single term: a parenthesized sub-expression, '.', an escape sequence, a character class, or a literal
	 * character. Every form other than a sub-expression pushes a new single-input machine onto the NFA stack.
	 * 
	 * @return A boolean that indicates whether the expression was successfully parsed or not. Only a failed
	 *         sub-expression yields false; the other forms always report success.
	 */
	private boolean parseTerm()
	{
		char current = this.getCurrentChar();

		if (current == '(')
		{
			// parenthesized sub-expression builds its own machine
			return this.parseSubExpression();
		}

		NFAGraph machine = new NFAGraph(this._acceptState);
		Input input;

		switch (current)
		{
			case '.':
				// wildcard
				this.advance();
				input = new AnyInput();
				break;

			case '\\':
				// escape sequence; the helper consumes it
				input = this.parseEscapedTerm();
				break;

			case '[':
				// character class; the helper consumes it
				input = this.parseCharacterClass();
				break;

			default:
				// plain literal character
				input = new CharacterInput(current);
				this.advance();
				break;
		}

		machine.add(input);
		this._nfaStack.push(machine);

		return true;
	}

	/**
	 * Parse a character class such as [abc], [^abc] or [a-z]. The cursor must be on the opening '['; on return it is
	 * positioned after the closing ']' when one was found.
	 * <p>
	 * A hyphen is a literal when it is the first member of the class (after an optional '^') or the last member
	 * before ']'. Between two literal characters it forms a range. A hyphen that follows a range or an escape
	 * sequence, and is not last, is skipped.
	 * <p>
	 * NOTE: an unterminated class (no closing ']') is not reported to the caller; whatever was collected is returned.
	 * NOTE: an escape sequence on the right-hand side of a range is not interpreted; the backslash itself becomes the
	 * end of the range.
	 * 
	 * @return The input describing the set of characters in the class
	 */
	private Input parseCharacterClass()
	{
		// advance over '['
		this.advance();

		CharacterClassInput cci = new CharacterClassInput();

		if (this.getCurrentChar() == '^')
		{
			// advance over '^'
			this.advance();

			// find complement of character class
			cci.setComplement(true);
		}

		if (this.getCurrentChar() == '-')
		{
			// a leading dash is a literal member of the class
			cci.addInput('-');

			// advance over '-'
			this.advance();
		}

		// most recent literal character that may start a range; '\0' means there is none
		char last = '\0';

		while (this.getEOS() == false && this.getCurrentChar() != ']')
		{
			switch (this.getCurrentChar())
			{
				case '-':
					// advance over '-'
					this.advance();

					if (this.getEOS() || this.getCurrentChar() == ']')
					{
						// a dash that closes the class is a literal; do not consume ']' as a range end
						cci.addInput('-');
					}
					else if (last != '\0')
					{
						// build character set
						cci.addInputs(last, this.getCurrentChar());

						// advance over character
						this.advance();
					}
					// otherwise the dash has no literal on its left and is skipped

					// reset last to catch hyphen errors
					last = '\0';
					break;

				case '\\':
					Input input = this.parseEscapedTerm();

					cci.addInputs(input.getCharacters());

					// an escape cannot start a range, so forget any earlier literal
					last = '\0';
					break;

				default:
					last = this.getCurrentChar();
					cci.addInput(last);

					// advance over character
					this.advance();
					break;
			}
		}

		if (this.getCurrentChar() == ']')
		{
			// advance over ']'
			this.advance();
		}

		return cci;
	}

	/**
	 * Parse a term escaped with a backslash. The cursor must be on the backslash. Recognized escapes are the classes
	 * d, D, s, S, w, W, the control characters f, n, r, t, v and a two-digit hexadecimal code introduced by x. Any
	 * other escaped character stands for itself.
	 * 
	 * @return The input that matches the escaped term
	 * @throws IllegalStateException
	 *             if x is not followed by two hexadecimal digits
	 */
	private Input parseEscapedTerm()
	{
		// Step over the backslash by hand: advance() would also skip whitespace,
		// and the escaped character may itself be whitespace.
		this._index++;

		char escaped = this.getCurrentChar();
		Input term;

		switch (escaped)
		{
			case 'd':
				term = new DigitInput();
				break;

			case 'D':
				term = new DigitInput();
				term.setComplement(true);
				break;

			case 's':
				term = new WhiteSpaceInput();
				break;

			case 'S':
				term = new WhiteSpaceInput();
				term.setComplement(true);
				break;

			case 'w':
				term = new WordInput();
				break;

			case 'W':
				term = new WordInput();
				term.setComplement(true);
				break;

			case 'f':
				term = new CharacterInput('\f');
				break;

			case 'n':
				term = new CharacterInput('\n');
				break;

			case 'r':
				term = new CharacterInput('\r');
				break;

			case 't':
				term = new CharacterInput('\t');
				break;

			case 'v':
				term = new CharacterInput('\u000B');
				break;

			case 'x':
			{
				// move onto the first hex digit, again without skipping whitespace
				this._index++;

				if (this.isHexDigit() == false)
				{
					throw new IllegalStateException(Messages.RegexParser_Malformed_Hex);
				}

				int high = Character.digit(this.getCurrentChar(), 16);

				// move onto the second hex digit
				this._index++;

				if (this.isHexDigit() == false)
				{
					throw new IllegalStateException(Messages.RegexParser_Malformed_Hex);
				}

				int low = Character.digit(this.getCurrentChar(), 16);

				term = new CharacterInput((char) (high * 16 + low));
				break;
			}

			default:
				// any other escaped character is taken literally
				term = new CharacterInput(escaped);
				break;
		}

		// consume the last character of the escape and any whitespace after it
		this.advance();

		return term;
	}

	/**
	 * Parse a parenthesized sub-expression. The cursor must be on the opening '('; the body is parsed as an Or
	 * expression and must be followed by ')'.
	 * 
	 * @return A boolean that indicates whether the expression was successfully parsed or not.
	 */
	private boolean parseSubExpression()
	{
		// step over '('
		this.advance();

		if (this.parseOrExpression() == false)
		{
			return false;
		}

		if (this.getCurrentChar() != ')')
		{
			// missing closing parenthesis
			return false;
		}

		// step over ')'
		this.advance();

		return true;
	}

	/**
	 * Prepare for a new parse by calling the static NFAGraph.reset() and emptying this parser's NFA stack
	 */
	public void reset()
	{
		NFAGraph.reset();
		_nfaStack.clear();
	}
}