XMLParserBase.java example

Explorer

studio2-master
- plugins
- tests
  - com.aptana.ide.core.io.tests
    - src
      - com
        aptana
        ide
        core
        io
        efs
        tests
        EFSUtilsTest.java
        LocalFileTest.java
        WorkspaceFileSystemTest.java
        WorkspaceFileTest.java
        tests
        BaseConnectionTest.java
        CommonConnectionTest.java
        filesystem
        ftp
        FTPCachedConnectionFileManager.java
        FTPCachedConnectionPoint.java
        tests
        AllTests.java
        FTPCachedConnectionTest.java
        FTPCommonConnectionTest.java
        FTPConnectionTest.java
        FTPConnectionWithBasePathTest.java
        SFTPConnectionTest.java
  - com.aptana.ide.core.spellcheck.tests
    - src
      - com
        aptana
        commons
        spelling
        engine
        AllTests.java
        NoCompletionsProposalTest.java
        SpellingAnnotationTest.java
        SpellingCorrectionProcessorTest.java
        TextInvocationContextTest.java
  - com.aptana.ide.core.tests
    - src
      - com
        aptana
        ide
        core
        io
        sync
        tests
        AllTests.java
        tests
        AllTests.java
        FileUtilsTest.java
        IdeLogTest.java
        KeyValuePairTest.java
        PackageTestCase.java
        PluginUtilsTest.java
        StreamUtilsTest.java
        StringUtilsTest.java
        TestingPlugin.java
        URLEncoderTest.java
        util
        FormattingUtils.java
        xpath
        XPathUtilsTest.java
      - jtest
        ProjectTestCase.java
  - com.aptana.ide.core.ui.tests
    - src
      - com
        aptana
        ide
        core
        io
        file
        tests
        AllTests.java
        tests
        AllTests.java
        ui
        tests
        AllTests.java
        CoreUIUtilsTest.java
        SetUtilsTest.java
        TestsPlugin.java
  - com.aptana.ide.debug.tests
    - src
      - com
        aptana
        ide
        debug
        test
        AbstractVariableInstruction.java
        AutomatedTestController.java
        BreakpointInstruction.java
        DelayInstruction.java
        GroupInstruction.java
        IInstruction.java
        IReference.java
        PrintValueInstruction.java
        SourceLineReferrence.java
        Startup.java
        StepInstruction.java
        SuspendResumeInstruction.java
        TerminateInstruction.java
        TestPlugin.java
        TestSession.java
        VerifyValueInstruction.java
  - com.aptana.ide.editor.css.tests
    - src
      - com
        aptana
        ide
        editor
        css
        tests
        AllTests.java
        TestIdentifierTokens.java
        TestKeywordTokens.java
        TestLiteralTokens.java
        TestPairFinder.java
        TestParseTime.java
        TestPunctuatorTokens.java
        TestStatements.java
        TestWhitespaceTokens.java
        TestsPlugin.java
        contentassist
        AllTests.java
        CSSContentAssistProcessorTest.java
        CSSUtilsTest.java
        editors
        css
        tests
        formatting
        AllTests.java
        FormattingTests.java
  - com.aptana.ide.editor.html.tests
    - src
      - com
        aptana
        ide
        editor
        html
        tests
        AllTests.java
        HTMLJSTest.java
        TestBugs.java
        TestDelimiterGroups.java
        TestKeywordTokens.java
        TestLiteralTokens.java
        TestPairFinder.java
        TestPunctuatorTokens.java
        TestStatements.java
        TestWhitespaceTokens.java
        TestingPlugin.java
        contentassist
        AllTests.java
        HTMLContentAssistProcessorTest.java
        HTMLUtilsTest.java
        formatting
        AllTests.java
        FormattingTests.java
        HTMLAutoIndentStrategyTest.java
  - com.aptana.ide.editor.js.tests
    - src
      - com
        aptana
        ide
        editor
        js
        tests
        AllTests.java
        Documentation2Tests.java
        JSLanguageEnvironmentTest.java
        TestComments.java
        TestDelimiterGroups.java
        TestIdentifierTokens.java
        TestKeywordTokens.java
        TestLexTime.java
        TestLiteralTokens.java
        TestPairFinder.java
        TestParseTime.java
        TestPunctuatorTokens.java
        TestStatements.java
        TestWhitespaceTokens.java
        TestingPlugin.java
        contentassist
        AllTests.java
        JSCompletionProposalTest.java
        JSContentAssistProcessorTest.java
        environment
        AllTests.java
        DOMTest.java
        JSCoreTest.java
        UserCodeTest.java
        formatting
        AllTests.java
        TestFormatting.java
        model
        AllTests.java
        TestArrayConstructor.java
        TestArrayFromInvocation.java
        TestArrayInstance.java
        TestBooleanConstructor.java
        TestBooleanFromInvocation.java
        TestBooleanInstance.java
        TestDateConstructor.java
        TestDateFromInvocation.java
        TestDateInstance.java
        TestErrorConstructor.java
        TestErrorFromInvocation.java
        TestErrorInstance.java
        TestFunctionConstructor.java
        TestFunctionFromInvocation.java
        TestFunctionInstance.java
        TestMathInstance.java
        TestModelBase.java
        TestNumberConstructor.java
        TestNumberFromInvocation.java
        TestNumberInstance.java
        TestObjectConstructor.java
        TestObjectFromInvocation.java
        TestObjectInstance.java
        TestProperties.java
        TestRegExpConstructor.java
        TestRegExpFromInvocation.java
        TestRegExpInstance.java
        TestStringConstructor.java
        TestStringFromInvocation.java
        TestStringInstance.java
        TestVariables.java
        outline
        AllTests.java
        ReusabilityTests.java
        TestBlockItems.java
        TestInheritanceItems.java
        TestOutlineItemBase.java
        TestScopeStrings.java
        TestSimpleItems.java
        testJSPartitions.java
        jscomment
        tests
        AllTests.java
        TestBugs.java
        TestDelimiterTokens.java
        TestLiteralTokens.java
        TestWhitespaceTokens.java
        scriptdoc
        tests
        AllTests.java
        TestDelimiterTokens.java
        TestDocumentationXML.java
        TestIdentifierTokens.java
        TestKeywordTokens.java
        TestLiteralTokens.java
        TestPunctuatorTokens.java
        TestWhitespaceTokens.java
        TransformOAATests.java
        runtime
        AllTests.java
        TestCodeGeneration.java
        TestOpcodes.java
  - com.aptana.ide.editor.xml.tests
    - src
      - com
        aptana
        ide
        editor
        xml
        tests
        AllTests.java
        TestBugs.java
        TestDTDTokens.java
        TestKeywordTokens.java
        TestLexTime.java
        TestLiteralTokens.java
        TestPairFinder.java
        TestParseTime.java
        TestPunctuatorTokens.java
        TestStatements.java
        TestingPlugin.java
        formatting
        AllTests.java
        FormattingTests.java
  - com.aptana.ide.editors.tests
    - src
      - com
        aptana
        ide
        editor
        junit
        profiles
        AllTests.java
        ProfileManagerTest.java
        ProfileTest.java
        editors
        junit
        AllTests.java
        ContentAssistTestCase.java
        ContentAssistTestSuite.java
        EditorsJunitPlugin.java
        GenericProject.java
        LexerUtils.java
        ProfileFile.java
        ProjectTestUtils.java
        TestCopyPasteAction.java
        TestDocumentCommand.java
        TestProject.java
        TestSelectionFormattingAction.java
        TestTextViewer.java
        TestUtils.java
        formatting
        AllTests.java
        SelectionFormattingTests.java
        UnifiedBracketInserterTest.java
        js
        AllTests.java
        JSEdgeCaseTests.java
        JSEdgeCasesProject.java
        JSTodoTests.java
        pairmatching
        AllTests.java
        PairMatchingTest.java
        partitions
        AllTests.java
        Messages.java
        PartitionsTest.java
        unified
        AllTests.java
        UnifiedViewerTest.java
        contentassist
        AbstractContentAssistProcessorTest.java
        AllTests.java
        CompletionProposalPopupTest.java
        UnifiedContentAssistProcessorTest.java
        tests
        views
        profiles
        AllTests.java
        ProfilesViewHelperTest.java
        unified
        errors
        tests
        AllTests.java
        ErrorDescriptorTest.java
  - com.aptana.ide.intro.tests
    - src
      - com
        aptana
        ide
        intro
        tests
        Activator.java
        AllTests.java
        OpenTestPageAction.java
        preferences
        AllTests.java
        FeatureDescriptorTest.java
        FeatureRegistryTest.java
        ProFeatureDescriptorTest.java
  - com.aptana.ide.logging.tests
    - src
      - com
        aptana
        ide
        logging
        impl
        AllTests.java
        InLineMatcherTest.java
        WorkspaceLogProviderTest.java
        tests
        AllTests.java
        FileWriterTest.java
        LoggingTestsPlugin.java
        PerfomanceTest.java
        ReaderWriterTest.java
  - com.aptana.ide.parsing.tests
    - src
      - com
        aptana
        ide
        lexer
        experimental
        CharAccessMethods.java
        FindAndReplace.java
        MatcherSpeedTests.java
        RegexMatchGroups.java
        ShowCategories.java
        matchers
        AllMatcherTests.java
        AndMatcherTest.java
        CharacterClassMatcherTest.java
        CharacterMatcherTest.java
        CommentMatcherTest.java
        DigitMatcherTest.java
        EndOfFileMatcherTest.java
        EndOfLineMatcherTest.java
        HexMatcherTest.java
        IdentifierMatcherTest.java
        LetterMatcherTest.java
        LetterOrDigitMatcherTest.java
        LineTerminatorMatcherTest.java
        LookaheadMatcherTest.java
        LowercaseLetterMatcherTest.java
        MatcherMapTest.java
        NumberMatcherTest.java
        OneOrMoreMatcherTest.java
        OptionalMatcherTest.java
        OrMatcherTest.java
        QuotedStringMatcherTest.java
        RegexMatcherTest.java
        RepetitionMatcherTest.java
        StartOfLineMatcherTest.java
        StringMatcherTest.java
        ToDelimiterMatcherTest.java
        UppercaseLetterMatcherTest.java
        WhitespaceMatcherTest.java
        WordBoundaryMatcherTest.java
        WordMatcherTest.java
        ZeroOrMoreMatcherTest.java
        tests
        AllTests.java
        TestLexeme.java
        TestLexemeList.java
        TestTokenBase.java
        metadata
        AllTests.java
        ElementMetadataTest.java
        MetadataItemTest.java
        MetadataRuntimeEnvironmentTest.java
        parsing
        bnf
        tests
        AllTests.java
        BootstrapTest.java
        ExpandedSourceTest.java
        FactoredGrammar.java
        FirstSetTest.java
        FollowSetTest.java
        ItemTests.java
        SampleGrammar.java
        SourceTest.java
        SymbolsTest.java
        TableTest.java
        TokenTypes.java
        experimental
        ASTHandlerParser.java
        AllTests.java
        BNFRunner.java
        Parser.java
        TestLRParserBuilder.java
        tests
        CoreTests.java
        ParseNodeTests.java
        ParseStateTests.java
        UITests.java
        xpath
        XPathStringTests.java
        XPathTests.java
        regex
        tests
        AllTests.java
        RegexTest.java
        TestStatements.java
  - com.aptana.ide.sax.tests
    - src
      - com
        aptana
        ide
        sax
        tests
        AllTests.java
        TestLexerSchemaBuilder.java
        TestMetadataSchemaBuilder.java
  - com.aptana.ide.server.core.tests
    - src
      - com
        aptana
        ide
        server
        AllServerCoreTests.java
        resources
        FileHttpResourceTest.java
        WorkspaceHttpFolderResourceTest.java
        WorkspaceHttpResourceTest.java
  - com.aptana.ide.server.tests
    - src
      - com
        aptana
        ide
        server
        tests
        AllTests.java
        ConfigurationTests.java
        ServerTypeDelegate.java
        ServersTest.java
        TestModuleType.java
        TestServer.java
  - com.aptana.ide.syncing.tests
    - src
      - com
        aptana
        ide
        io
        ftp
        tests
        AllTests.java
        syncing
        tests
        AllTests.java
        FTPSyncingTests.java
        FTPSyncingTestsWithSpaces.java
        LocalSyncingTests.java
        LocalSyncingTestsWithSpaces.java
        SyncingTests.java
        TestsPlugin.java
  - com.aptana.ide.tests
    - src
      - com
        aptana
        ide
        experimental
        ResourceVsFile.java
        UTFvsString.java
        WritingStrings.java
        tests
        AllPluginTests.java
        CoreTests.java
        TestsPlugin.java
        UITests.java
- tools
  - com.aptana.ide.parsing.tools
    - com
      - aptana
        parsing
        metadata
        oaa
        ClosureType.java
        OAAElementDefinition.java
        OAAHandler.java
        OAAList.java
        OAAParser.java
        OAAReference.java
        OAATest.java
        tools
        AllMetadataToBinary.java
        AllScriptDocsToBinary.java
        GenerateAllBinaries.java
        Messages.java
        MetadataToBinary.java
        ScriptDocToBinary.java
  - com.aptana.parsing.adapter
    - src
      - org
        eclipse
        core
        runtime
        IStatus.java
        Log.java
        Platform.java
        Plugin.java
        Preferences.java
        Status.java
        osgi
        util
        NLS.java
        osgi
        framework
        Bundle.java
        BundleContext.java
        Constants.java

/* ***** BEGIN LICENSE BLOCK *****
 * Version: GPL 3
 *
 * This program is Copyright (C) 2007-2008 Aptana, Inc. All Rights Reserved
 * This program is licensed under the GNU General Public license, version 3 (GPL).
 *
 * This program is distributed in the hope that it will be useful, but
 * AS-IS and WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE, TITLE, or
 * NONINFRINGEMENT. Redistribution, except as permitted by the GPL,
 * is prohibited.
 *
 * You can redistribute and/or modify this program under the terms of the GPL, 
 * as published by the Free Software Foundation.  You should
 * have received a copy of the GNU General Public License, Version 3 along
 * with this program; if not, write to the Free Software Foundation, Inc., 51
 * Franklin St, Fifth Floor, Boston, MA 02110-1301 USA.
 * 
 * Aptana provides a special exception to allow redistribution of this file
 * with certain other code and certain additional terms
 * pursuant to Section 7 of the GPL. You may view the exception and these
 * terms on the web at http://www.aptana.com/legal/gpl/.
 * 
 * You may view the GPL, and Aptana's exception and additional terms in the file
 * titled license-jaxer.html in the main distribution folder of this program.
 * 
 * Any modifications to this file must keep this entire header intact.
 *
 * ***** END LICENSE BLOCK ***** */
package com.aptana.ide.editor.xml.parsing;

import java.text.ParseException;

import com.aptana.ide.editor.xml.lexing.XMLTokenTypes;
import com.aptana.ide.editors.unified.parsing.UnifiedParser;
import com.aptana.ide.lexer.ILexer;
import com.aptana.ide.lexer.Lexeme;
import com.aptana.ide.lexer.LexerException;
import com.aptana.ide.lexer.Range;
import com.aptana.ide.parsing.IParseState;
import com.aptana.ide.parsing.ParserInitializationException;
import com.aptana.ide.parsing.nodes.IParseNode;

/**
 * @author Kevin Lindsey
 */
public class XMLParserBase extends UnifiedParser
{
	private static final String TEXT_GROUP = "text"; //$NON-NLS-1$
	private static final String ERROR_GROUP = "error"; //$NON-NLS-1$
	
	protected static final String DEFAULT_GROUP = "default"; //$NON-NLS-1$
	protected static final String XML_DECLARATION_GROUP = "xml-declaration"; //$NON-NLS-1$
	protected static final String CDATA_SECTION_GROUP = "cdata-section"; //$NON-NLS-1$
	protected static final String PROCESSING_INSTRUCTION_GROUP = "processing-instruction"; //$NON-NLS-1$
	
	public static final String DOCTYPE_DECLARATION_GROUP = "doctype-declaration"; //$NON-NLS-1$
	
	protected IParseNode _currentElement;
	
	/**
	 * XMLParserBase
	 * 
	 * @throws ParserInitializationException
	 */
	public XMLParserBase() throws ParserInitializationException
	{
		this(XMLMimeType.MimeType);
	}
	
	/**
	 * XMLParserBase
	 * 
	 * @param language
	 * @throws ParserInitializationException
	 */
	public XMLParserBase(String language) throws ParserInitializationException
	{
		super(language);
	}
	
	/**
	 * Advance to the next lexeme in the lexeme stream
	 * 
	 * @throws LexerException
	 */
	protected void advance() throws LexerException
	{
		ILexer lexer = this.getLexer();
		Lexeme currentLexeme = EOS;

		if (this._currentElement != null && this.currentLexeme != null && this.currentLexeme != EOS)
		{
			this._currentElement.includeLexemeInRange(this.currentLexeme);
		}
		
		if (lexer.isEOS() == false)
		{
			boolean inWhitespace = true;

			while (inWhitespace)
			{
				if (lexer.isEOS() == false)
				{
					currentLexeme = lexer.getNextLexeme();

					if (currentLexeme == null && lexer.isEOS() == false)
					{
						// Switch to error group.
						// NOTE: We want setGroup's exception to propagate since
						// that indicates an internal inconsistency when it
						// fails
						lexer.setGroup(ERROR_GROUP);

						currentLexeme = lexer.getNextLexeme();
					}

					if (currentLexeme != null)
					{
						if (currentLexeme.typeIndex == XMLTokenTypes.START_COMMENT)
						{
							// reset lexer position
							lexer.setCurrentOffset(currentLexeme.offset);

							// set group for unclosed comment type
							lexer.setGroup("unclosed-comment"); //$NON-NLS-1$

							// rescan
							currentLexeme = lexer.getNextLexeme();
						}
					}

					if (currentLexeme == null)
					{
						// couldn't recover from error, so mark as end of stream
						// NOTE: We may want to throw an exception here since we
						// should be able to return at least an ERROR token
						currentLexeme = EOS;
						inWhitespace = false;
					}
					else
					{
						this.addLexeme(currentLexeme);
						inWhitespace = false;
					}
				}
			}
		}

		this.currentLexeme = currentLexeme;
	}
	
	/**
	 * @see com.aptana.ide.parsing.AbstractParser#createParseState(com.aptana.ide.parsing.IParseState)
	 */
	public IParseState createParseState(IParseState parent)
	{
		IParseState result;
		
		if (parent == null)
		{
			result = new XMLParseState();
		}
		else
		{
			result = new XMLParseState(parent);
		}
		
		return result;
	}
	
	/**
	 * @see com.aptana.ide.parsing.AbstractParser#initializeLexer()
	 */
	public void initializeLexer() throws LexerException
	{
		ILexer lexer = this.getLexer();
		String language = this.getLanguage();

		// ignore whitespace
		lexer.setIgnoreSet(language, new int[] { XMLTokenTypes.WHITESPACE });
		lexer.setLanguageAndGroup(language, DEFAULT_GROUP);
	}
	
	/**
	 * parseDocTypeDeclaration
	 */
	protected void parseDocTypeDeclaration() throws LexerException
	{
		// NOTE: [KEL] ideally, this will be a nested language, but since we're in a bit of flux
		// with respect to colorization and parsing, I'm inlining DTD parsing here
		ILexer lexer = this.getLexer();
		int initialOffset = lexer.getEOFOffset();
		
		try
		{
			// find end of doctype section and apply to lexer virtual eof
			Range range = lexer.find("doctype-declaration-delimiter"); //$NON-NLS-1$
	
			int offset = range.getEndingOffset();
	
			if (range.isEmpty())
			{
				offset = lexer.getSourceLength();
			}
			
			lexer.setEOFOffset(offset);
			
			// change groups
			lexer.setGroup(DOCTYPE_DECLARATION_GROUP);
			
			this.advance();
			
			// process until eof
			while (this.isEOS() == false)
			{
				this.advance();
			}
		}
		finally
		{
			// restore original eof
			lexer.setEOFOffset(initialOffset);
			lexer.setGroup(DEFAULT_GROUP);
			
			// re-prime
			this.advance();
		}
	}
	
	/**
	 * parseText
	 * 
	 * @param verify
	 * @throws LexerException
	 * @throws ParseException 
	 */
	protected void parseText(boolean verify) throws LexerException, ParseException
	{
		// get reference to lexer
		ILexer lexer = this.getLexer();

		// switch to text group
		lexer.setGroup(TEXT_GROUP);

		// advance over '>' or '/>'
		if (verify)	
		{
			this.assertAndAdvance(XMLTokenTypes.GREATER_THAN, "error.tag.end.close"); //$NON-NLS-1$
		}
		else
		{
			this.advance();
		}

		// switch back to default group
		lexer.setGroup(DEFAULT_GROUP);

		if (this.currentLexeme == EOS || this.isType(XMLTokenTypes.ERROR))
		{
			if (this.currentLexeme != EOS)
			{
				lexer.setCurrentOffset(this.currentLexeme.offset);
				this.removeLexeme(this.currentLexeme);
			}

			// rescan in case we have a false EOS
			this.advance();
		}
	}
}