RubyTokenScanner.java example

Explorer

rdt-master
- plugins
- tests
  - com.aptana.rdt.tests
    - src
      - com
        aptana
        rdt
        AptanaRDTTests.java
        TS_Aptana.java
        core
        rspec
        RSpecStructureCreatorTest.java
        internal
        core
        gems
        AbstractGemParserTestCase.java
        AllTests.java
        GemManagerTest.java
        GemOnePointTwoParserTest.java
        GemParserTest.java
        HybridGemParserTest.java
        ShortListingGemParserTest.java
        parser
        warnings
        AccidentalBooleanAssignmentVisitorTest.java
        ConstantNamingConventionTest.java
        ControlCoupleTest.java
        DynamicVariableAliasesLocalTest.java
        FeatureEnvyTest.java
        LocalsMaskingMethodsVisitorTest.java
        MockProblemRequestor.java
        TC_CodeComplexity.java
        TC_CodeComplexityMaxLocals.java
        TC_CodeComplexityTooManyArguments.java
        TC_CodeComplexityTooManyReturns.java
        TC_ComparableInclusionVisitor.java
        TC_EnumerableInclusionVisitor.java
        TC_SimilarVariableNameVisitor.java
        TC_UnecessaryElseVisitor.java
        TS_ParserWarnings.java
        UncommunicativeNameTest.java
        WarningVisitorTest.java
  - org.rubypeople.eclipse.shams
    - src
      - org
        rubypeople
        eclipse
        shams
        debug
        core
        ShamLaunchConfiguration.java
        ShamLaunchConfigurationType.java
        ShamLaunchConfigurationWorkingCopy.java
        ShamLaunchManager.java
        resources
        ShamContainer.java
        ShamFile.java
        ShamFolder.java
        ShamProject.java
        ShamResource.java
        ShamResourceProxy.java
        runtime
        ShamException.java
        ShamIPath.java
        ShamPreferences.java
  - org.rubypeople.eclipse.testutils
    - src
      - org
        rubypeople
        eclipse
        testutils
        ResourceTools.java
  - org.rubypeople.rdt.core.tests
    - src
      - org
        rubypeople
        rdt
        TS_RdtCore.java
        core
        formatter
        TC_EditableFormatHelper.java
        TestReWriteVisitor.java
        rewriter
        TestBooleanStateStack.java
        tests
        AbstractRubyModelTest.java
        ModifyingResourceTest.java
        model
        BufferTests.java
        util
        Util.java
        util
        TS_CoreUtil.java
        UtilTest.java
        internal
        TS_Internal.java
        codeassist
        CompletionContextTest.java
        CompletionEngineTest.java
        TS_InternalCodeAssist.java
        core
        ShamResourceChangeEvent.java
        ShamResourceDelta.java
        TC_LoadPathEntry.java
        TC_RubyCore.java
        TC_RubyProject.java
        TS_InternalCore.java
        builder
        TS_InternalCoreBuilder.java
        parser
        ShamNode.java
        TC_RubyParser.java
        TC_TaskParser.java
        TS_InternalCoreParser.java
        warnings
        AbstractRubyLintVisitorTestCase.java
        ConstantReassignmentVisitorTest.java
        CoreClassReOpeningTest.java
        EmptyStatementVisitorTest.java
        Ruby19HashCommaSyntaxTest.java
        Ruby19WhenStatementsTest.java
        TS_InternalCoreParserWarnings.java
        search
        AllTests.java
        MethodPatternParserTest.java
        util
        ASTUtilTest.java
        TS_Util.java
        formatter
        AbstractCodeFormatterTestCase.java
        TC_ASTBasedCodeFormatter.java
        TC_CodeFormatter.java
        TS_InternalFormatter.java
        ti
        CombinedTypeInferrerTest.java
        DataFlowTypeInferrerTest.java
        ReferenceMatchTest.java
        TS_TypeInference.java
        TypeInferrerTest.java
        TypeInferrerTestCase.java
  - org.rubypeople.rdt.debug.core.tests
    - src
      - org
        rubypeople
        rdt
        debug
        core
        tests
        FTC_AbstractDebuggerCommunicationTest.java
        FTC_ClassicDebuggerCommunicationTest.java
        FTC_DebuggerLaunch.java
        FTC_DebuggerProxyTest.java
        FTC_ReadStrategyTest.java
        FTC_RubyDebugCommunicationTest.java
        FTC_Single.java
        FTS_Debug.java
        NonBlockingSocketReader.java
        OutputRedirectorThread.java
        RdtDebugTestsPlugin.java
        TC_RubyDebugTarget.java
        TS_UnitTests.java
        TestRubyDebugTarget.java
        TestXmlStreamReader.java
        WasteReader.java
  - org.rubypeople.rdt.debug.ui.tests
    - src
      - org
        rubypeople
        rdt
        debug
        ui
        tests
        RdtDebugUiTestsPlugin.java
        TS_DebugUi.java
        internal
        debug
        ui
        TC_RubyConsoleTracker.java
        TC_RubySourceLocator.java
        TS_InternalDebugUi.java
        launcher
        ShamApplicationLaunchConfigurationDelegate.java
        TC_RubyApplicationShortcut.java
        TC_RubyArgumentsTab.java
        TC_RubyEntryPointTab.java
        TC_RubyEnvironmentTab.java
        TS_InternalDebugUiLauncher.java
  - org.rubypeople.rdt.launching.tests
    - src
      - org
        rubypeople
        rdt
        internal
        launching
        EvaluateRubyProcessOutput.java
        ShamProcess.java
        TC_RubyInterpreter.java
        TC_RubyRuntime.java
        TC_RunnerLaunching.java
        TS_InternalLaunching.java
        TestRubyDebugDebugger.java
        TestVM.java
        TestVMDebugger.java
        TestVMRunner.java
        TestVMType.java
        launching
        tests
        TS_Launching.java
  - org.rubypeople.rdt.refactoring.tests
    - src
      - org
        rubypeople
        rdt
        refactoring
        tests
        FilePropertyData.java
        FileTestCase.java
        FileTestData.java
        FileTestSuite.java
        MultiFileTestData.java
        RefactoringConditionTestCase.java
        RefactoringTestCase.java
        TS_All.java
        TestsPlugin.java
        TreeProviderTester.java
        TwoLayerTreeEditProviderTester.java
        classnodeprovider
        ClassNodeProviderTester.java
        TC_ClassNodeProvider.java
        TC_IncludedClassesProvider.java
        TS_ClassNodeProvider.java
        core
        MultipleDocumentsInOneProvider.java
        TC_ModuleNodeProvider.java
        TC_NodeProvider.java
        TC_RefactoringConditionChecker.java
        TC_SelectionNodeProvider.java
        TS_Core.java
        convertlocaltofield
        LocalToFieldTester.java
        TS_LocalToField.java
        conditionchecks
        LocalToFieldConditionTester.java
        TS_LocalToFieldChecks.java
        encapsulatefield
        EncapsulateFieldTester.java
        TS_EncapsulateField.java
        conditionchecks
        EncapsulateFieldConditionTester.java
        TS_EncapsulateFieldChecks.java
        extractconstant
        ExtractConstantTester.java
        TS_ExtractConstant.java
        conditionchecks
        ExtractConstantConditionTester.java
        TS_ExtractConstantChecks.java
        extractmethod
        ExtractMethodTester.java
        TS_ExtractMethod.java
        conditionchecks
        ExtractMethodConditionTester.java
        TS_ExtractMethodChecks.java
        generateaccessors
        AccessorSelection.java
        GenerateAccessorTester.java
        TC_AccessorsGeneratorTreeTest.java
        TS_GenerateAccessors.java
        generateconstructor
        ConstructorGeneratorTester.java
        TC_ConstructorGeneratorTreeTest.java
        TS_GenerateConstructor.java
        inlineclass
        ClassInlinerTester.java
        TS_InlineClass.java
        conditionchecks
        InlineClassConditionTester.java
        TS_InlineClassChecks.java
        inlinelocal
        LocalInlinerTester.java
        TS_InlineLocal.java
        conditionchecks
        InlineLocalConditionTester.java
        TS_InlineLocalConditionChecks.java
        inlinemethod
        FinderTestsBase.java
        InlineMethodTester.java
        TC_MethodBodyStatementReplacer.java
        TC_MethodFinder.java
        TC_ParameterReplacer.java
        TC_RenameDuplicatedVariables.java
        TC_ReturnStatementReplacer.java
        TC_SelectedCallFinder.java
        TC_TargetClassFinder.java
        TS_InlineMethod.java
        conditions
        InlineMethodConditionTester.java
        TS_InlineMethodChecks.java
        mergeclasspartsinfile
        ClassPartSelectorTester.java
        TS_MergeClassPartsInFile.java
        conditionchecks
        MergeInFileConditionTester.java
        TS_MergeClassPartsInFileChecks.java
        mergewithexternalclassparts
        MergeWithExternalClassPartsTester.java
        TS_MergeWithExternalClassParts.java
        conditionchecks
        MergeWithExternalConditionTester.java
        TS_MergetWitExternalChecks.java
        movefield
        MoveFieldTester.java
        TS_MoveField.java
        conditionchecks
        MoveFieldConditionTester.java
        TS_MoveFieldChecks.java
        movemethod
        MoveMethodTester.java
        TS_MoveMethod.java
        conditionchecks
        MoveMethodConditionTester.java
        TS_MoveMethodChecks.java
        nodewrapper
        TC_FieldNodeWrapper.java
        TC_MethodNodeWrapper.java
        TS_NodeWrapper.java
        overridemethod
        OverrideMethodTester.java
        TC_MethodOverriderTreeTest.java
        TC_OverridenMethodEditTest.java
        TS_OverrideMethod.java
        pushdown
        PushDownTester.java
        TC_MethodDownPusherTreeTest.java
        TS_PushDown.java
        rename
        RenameTester.java
        TS_Rename.java
        renameclass
        ClassRenameTester.java
        TC_ClassFinder.java
        TC_ClassInstanciationFinder.java
        TS_RenameClass.java
        conditionchecker
        RenameClassConditionTester.java
        TS_RenameClassChecks.java
        renamefield
        FieldRenamerTester.java
        TS_RenameField.java
        conditionchecks
        RenameFieldConditionTester.java
        TS_RenameFieldChecks.java
        renamelocal
        RenameLocalTester.java
        TS_RenameLocal.java
        conditionchecks
        RenameLocalConditionTester.java
        TS_RenameLocalCondition.java
        renamemethod
        MethodRenamerTester.java
        TS_RenameMethod.java
        conditioncheck
        RenameMethodConditionTester.java
        TS_RenameMethodChecks.java
        selection
        RenameMethodSelectionTester.java
        TS_RenameMethodSelection.java
        renamemodule
        ModuleRenameTester.java
        TC_ModuleInclusionFinder.java
        TS_RenameModule.java
        conditionchecker
        RenameModuleConditionTester.java
        TS_RenameModuleChecks.java
        splitlocal
        SplitLocalTester.java
        TC_LocalVarFinder.java
        TC_SplittedVariableRenamer.java
        TS_SplitLocal.java
        conditionchecks
        SplitLocalConditionTester.java
        TS_SplitLocalChecks.java
        util
        TC_FileHelper.java
        TC_HSRFormatter.java
        TC_NameHelper.java
        TC_NameValidator.java
        TC_NodeUtil.java
        TC_StringHelper.java
        TS_Util.java
  - org.rubypeople.rdt.tests.all
    - src
      - org
        rubypeople
        rdt
        tests
        all
        TS_RdtAllFunctionalTests.java
        TS_RdtAllUnitTests.java
  - org.rubypeople.rdt.ui.tests
    - src
      - org
        rubypeople
        rdt
        internal
        corext
        util
        RDocUtiltest.java
        ui
        RdtUiTestsPlugin.java
        TC_ResourceAdapterFactory.java
        TC_RubyFileMatcher.java
        TC_StackTraceLine.java
        TS_InternalUi.java
        rubyeditor
        TC_TabConverter.java
        TS_InternalUiRubyEditor.java
        search
        MarkOccurrencesTest.java
        MockTreeViewer.java
        TS_InternalUiRubySearch.java
        text
        TC_RubyPartitionScanner.java
        TC_RubyWordFinder.java
        TS_InternalUiText.java
        TestDocumentCommand.java
        ruby
        TC_RubyAutoIndentStrategy.java
        TC_RubyTokenScanner.java
        spelling
        SpellCheckEngineTest.java
        util
        InternalUIUtilTests.java
        StringMatcherTest.java
        TwoArrayQuickSorterTest.java
        ui
        tests
        TS_Ui.java

package org.rubypeople.rdt.internal.ui.text.ruby;

import java.io.IOException;
import java.io.StringReader;

import org.eclipse.core.runtime.Preferences;
import org.eclipse.jface.text.BadLocationException;
import org.eclipse.jface.text.IDocument;
import org.eclipse.jface.text.rules.IToken;
import org.eclipse.jface.text.rules.ITokenScanner;
import org.eclipse.jface.text.rules.Token;
import org.jruby.CompatVersion;
import org.jruby.common.NullWarnings;
import org.jruby.lexer.yacc.LexerSource;
import org.jruby.lexer.yacc.RubyYaccLexer;
import org.jruby.lexer.yacc.SyntaxException;
import org.jruby.lexer.yacc.RubyYaccLexer.LexState;
import org.jruby.parser.ParserConfiguration;
import org.jruby.parser.ParserSupport;
import org.jruby.parser.RubyParserResult;
import org.jruby.parser.Tokens;
import org.jruby.util.KCode;
import org.rubypeople.rdt.internal.ui.RubyPlugin;
import org.rubypeople.rdt.ui.PreferenceConstants;

/**
 * A token scanner which returns integers for ruby tokens. These can later be mapped to colors.
 * Does some smoothing on the tokens to add additional token types that the JRuby parser ignores.
 * <p>
 * Usage: call {@link #setRange(IDocument, int, int)} first, then call {@link #nextToken()}
 * repeatedly until it returns {@link Token#EOF}. After each call, {@link #getTokenOffset()} and
 * {@link #getTokenLength()} describe the span of the token just returned, expressed in
 * document coordinates (the range offset passed to {@code setRange} is added back in).
 * <p>
 * Every non-EOF token carries an {@link Integer} as its data: either one of the JRuby
 * {@link Tokens} ids, a raw character code, or {@link #CHARACTER}.
 * 
 * @author Chris Williams
 *
 */
public class RubyTokenScanner implements ITokenScanner {

	/** Token id matched for {@code ','} (its character code). */
	private static final int COMMA = 44;
	/** Token id matched for {@code ':'} (its character code). */
	private static final int COLON = 58;
	/** Token id matched for a line feed (its character code). */
	private static final int NEWLINE = 10;
	/** Synthetic token id emitted by this scanner for character literals such as {@code ?a}. */
	public static final int CHARACTER = 128;
	/** Lower bound (inclusive) of the token id range treated as built-in keywords. */
	static final int MIN_KEYWORD = 257;
	/** Upper bound (inclusive) of the token id range treated as built-in keywords. */
	static final int MAX_KEYWORD = 303;

	private RubyYaccLexer lexer;
	private LexerSource lexerSource;
	private ParserSupport parserSupport;
	
	/** Length of the token most recently returned by {@link #nextToken()}. */
	private int fTokenLength;
	/** Document offset of the token most recently returned by {@link #nextToken()}. */
	private int fOffset;
	
	/** True while the tokens being scanned belong to a symbol that has already been opened. */
	private boolean isInSymbol;
	/** True after an {@code alias} keyword, until the next bare ':' is seen. */
	private boolean inAlias;
	private RubyParserResult result;
	/** Offset of the scanned range inside the document. */
	private int origOffset;
	/** Length of the scanned range as requested by the caller. */
	private int origLength;
	/** Text of the scanned range; indices into it are relative to {@link #origOffset}. */
	private String fContents;	

	/**
	 * Creates a scanner with a freshly configured JRuby lexer. No source is attached until
	 * {@link #setRange(IDocument, int, int)} is called.
	 */
	public RubyTokenScanner() {
		lexer = new RubyYaccLexer();
		parserSupport = new ParserSupport();
		ParserConfiguration config = createParserConfiguration();
		parserSupport.setConfiguration(config);
		result = new RubyParserResult();
		parserSupport.setResult(result);
		lexer.setParserSupport(parserSupport);
		lexer.setWarnings(new NullWarnings());
		lexer.setEncoding(config.getKCode().getEncoding());
	}

	/**
	 * Builds the parser configuration shared by the constructor and
	 * {@link #setRange(IDocument, int, int)}, so both always use identical settings.
	 */
	private static ParserConfiguration createParserConfiguration() {
		return new ParserConfiguration(KCode.NIL, 0, true, false, CompatVersion.RUBY1_8);
	}

	/**
	 * @return the length of the last token returned by {@link #nextToken()}
	 */
	public int getTokenLength() {
		return fTokenLength;
	}

	/**
	 * @return the document offset of the last token returned by {@link #nextToken()}
	 */
	public int getTokenOffset() {
		return fOffset;
	}

	/**
	 * Advances the lexer by one token and returns it.
	 * 
	 * @return {@link Token#EOF} when the lexer has no more input, or when a syntax error is
	 *         raised with the lexer positioned exactly at the end of the range; otherwise a
	 *         token whose data is an {@link Integer} token id. A syntax error elsewhere yields
	 *         a token carrying {@code Tokens.yyErrorCode}; a {@link NumberFormatException} or
	 *         {@link IOException} yields a token carrying {@code Tokens.tIDENTIFIER}.
	 */
	public IToken nextToken() {
		fOffset = getOffset();
		fTokenLength = 0;
		// Fallback result used when the lexer fails in a way we can recover from.
		IToken fallback = asToken(Tokens.tIDENTIFIER);
		try {
			// FIXME if we're assigning a string to a variable we may get a NumberFormatException here!
			boolean hasMore = lexer.advance();
			if (!hasMore) {
				return Token.EOF;
			}
			fTokenLength = getOffset() - fOffset;
			return token(lexer.token());
		} catch (SyntaxException se) {
			if (lexerSource.getOffset() - origLength == 0) {
				// return eof if we hit a problem found at end of parsing
				return Token.EOF;
			}
			fTokenLength = getOffset() - fOffset;
			return token(Tokens.yyErrorCode); // FIXME This should return a special error token!
		} catch (NumberFormatException nfe) {
			// Cover whatever the lexer consumed so the caller keeps making progress.
			fTokenLength = getOffset() - fOffset;
			return fallback;
		} catch (IOException e) {
			RubyPlugin.log(e);
			return fallback;
		}
	}

	/**
	 * @return the lexer's current position translated into document coordinates
	 */
	private int getOffset() {
		return lexerSource.getOffset() + origOffset;
	}

	/**
	 * Wraps a token id in an {@link IToken} whose data is the boxed id.
	 */
	private static IToken asToken(int id) {
		return new Token(Integer.valueOf(id));
	}

	/**
	 * Maps a raw lexer token id to the token handed to the caller, applying the scanner's
	 * smoothing rules (symbol tracking, alias workaround, user keywords, character literals).
	 * 
	 * @param i the token id reported by the lexer
	 * @return the token to return from {@link #nextToken()}
	 */
	private IToken token(int i) {
		if (isInSymbol) {
			if (isSymbolTerminator(i)) {
				isInSymbol = false; // we're at the end of the symbol
				if (shouldReturnDefault(i)) {
					return asToken(i);
				}
			}
			// Everything else inside (or ending) a symbol is reported as part of the symbol.
			return asToken(Tokens.tSYMBEG);
		}
		// The next two conditionals work around a JRuby parsing bug
		// JRuby returns the number for ':' on second symbol's beginning in alias calls
		if (i == Tokens.kALIAS) {
			inAlias = true;
		}
		if (i == COLON && inAlias) {
			isInSymbol = true;
			inAlias = false;
			return asToken(Tokens.tSYMBEG);
		} // end JRuby parsing hack for alias
		if (isKeyword(i)) {
			return asToken(Tokens.k__FILE__); // FIXME Set up a token for user defined keywords
		}
		switch (i) {
		case Tokens.tSYMBEG:
			if (looksLikeTernaryConditionalWithNoSpaces()) {
				return asToken(Tokens.tCOLON2);
			}
			isInSymbol = true;
			// FIXME Set up a token for symbols
			return asToken(Tokens.tSYMBEG);
		case Tokens.tGVAR:
		case Tokens.tBACK_REF:
			return asToken(Tokens.tGVAR);
		case Tokens.tFLOAT:
		case Tokens.tINTEGER:
			// A character is marked as an integer, lets check for that special case...
			// NOTE(review): the probe looks one character past the token's start offset;
			// presumably the reported span begins one character before the '?' - confirm.
			int probe = (fOffset - origOffset) + 1;
			if (probe < fContents.length() && fContents.charAt(probe) == '?') {
				return asToken(CHARACTER);
			}
			return asToken(i);
		default:
			return asToken(i);
		}
	}

	/**
	 * Decides whether a one-character symbol-begin token is really the ':' of a conditional
	 * written without spaces, by checking that the character immediately before the token is a
	 * non-whitespace identifier character.
	 */
	private boolean looksLikeTernaryConditionalWithNoSpaces() {
		if (fTokenLength > 1) {
			return false;
		}
		int index = (fOffset - origOffset) - 1;
		// Explicit bounds check instead of relying on an exception for control flow.
		if (index < 0 || fContents == null || index >= fContents.length()) {
			return false;
		}
		char c = fContents.charAt(index);
		return !Character.isWhitespace(c) && Character.isUnicodeIdentifierPart(c);
	}

	/**
	 * @return true if a token that terminates a symbol must be reported as itself rather than
	 *         being coloured as part of the symbol
	 */
	private boolean shouldReturnDefault(int i) {
		switch (i) {
		case NEWLINE:
		case COMMA:
		case Tokens.tASSOC:
		case Tokens.tRPAREN:
			return true;
		default:
			return false;
		}
	}

	/**
	 * @return true if the given token id ends the symbol currently being scanned; this is the
	 *         case for every built-in keyword and for the token ids listed below
	 */
	private boolean isSymbolTerminator(int i) {
		if (isRealKeyword(i)) {
			return true;
		}
		switch (i) {
		case Tokens.tAREF:
		case Tokens.tCVAR:
		case Tokens.tMINUS:
		case Tokens.tPLUS:
		case Tokens.tPIPE:
		case Tokens.tCARET:
		case Tokens.tLT:
		case Tokens.tGT:
		case Tokens.tAMPER:
		case Tokens.tSTAR2:
		case Tokens.tDIVIDE:
		case Tokens.tPERCENT:
		case Tokens.tBACK_REF2:
		case Tokens.tTILDE:
		case Tokens.tCONSTANT: 
		case Tokens.tFID:
		case Tokens.tASET:
		case Tokens.tIDENTIFIER: 
		case Tokens.tIVAR:
		case Tokens.tGVAR:
		case Tokens.tASSOC:
		case Tokens.tLSHFT:
		case Tokens.tRPAREN:
		case COMMA:
		case NEWLINE:
			return true;
		default:
			return false;
		}
	}

	/**
	 * @return true if the token id lies in the inclusive range
	 *         [{@link #MIN_KEYWORD}, {@link #MAX_KEYWORD}]
	 */
	private boolean isRealKeyword(int i) {
		return i >= MIN_KEYWORD && i <= MAX_KEYWORD;
	}

	/**
	 * Checks whether the current identifier token matches one of the user-defined keywords
	 * stored, comma separated, under {@link PreferenceConstants#EDITOR_USER_KEYWORDS}.
	 * Surrounding whitespace is ignored on both the token text and each configured keyword, so
	 * a preference value such as {@code "foo, bar"} matches both {@code foo} and {@code bar}.
	 * 
	 * @param i the token id reported by the lexer
	 * @return true only for identifier tokens whose text equals a configured keyword
	 */
	private boolean isKeyword(int i) {
		if (i != Tokens.tIDENTIFIER) {
			return false;
		}
		String src;
		try {
			int start = fOffset - origOffset;
			src = fContents.substring(start, start + fTokenLength);
		} catch (RuntimeException e) {
			// Token span fell outside the cached range text; log and treat as "not a keyword".
			RubyPlugin.log(e);
			return false;
		}
		String candidate = src.trim();
		if (candidate.length() == 0) {
			return false;
		}
		Preferences prefs = RubyPlugin.getDefault().getPluginPreferences();
		if (prefs == null) {
			return false;
		}
		String rawKeywords = prefs.getString(PreferenceConstants.EDITOR_USER_KEYWORDS);
		if (rawKeywords == null || rawKeywords.length() == 0) {
			return false;
		}
		String[] keywords = rawKeywords.split(",");
		for (int j = 0; j < keywords.length; j++) {
			if (keywords[j] == null) {
				continue;
			}
			if (keywords[j].trim().equals(candidate)) {
				return true;
			}
		}
		return false;
	}

	/**
	 * Points the scanner at a region of the document and resets all scanning state.
	 * If the region is not valid for the document, the scanner is given empty input, so the
	 * first call to {@link #nextToken()} is expected to return {@link Token#EOF}.
	 * 
	 * @param document the document to read from
	 * @param offset start of the region inside the document
	 * @param length number of characters in the region
	 */
	public void setRange(IDocument document, int offset, int length) {
		lexer.reset();
		lexer.setState(LexState.EXPR_BEG);
		parserSupport.initTopLocalVariables();
		// Both smoothing flags must be cleared, otherwise an 'alias' seen at the end of the
		// previous range would turn the next ':' of this range into a symbol start.
		isInSymbol = false;
		inAlias = false;
		ParserConfiguration config = createParserConfiguration();
		try {
			fContents = document.get(offset, length);
		} catch (BadLocationException e) {
			// Keep the cached text in sync with the (empty) lexer source instead of leaving
			// the previous range's contents, or null, behind.
			fContents = "";
		}
		lexerSource = LexerSource.getSource("filename", new StringReader(fContents), null, config);
		lexer.setSource(lexerSource);
		origOffset = offset;
		origLength = length;
	}
}