XpandLexer.java example

Explorer
gmf-tooling-master
/*
 * Copyright (c) 2006, 2009 Borland Software Corporation and others.
 * All rights reserved.   This program and the accompanying materials
 * are made available under the terms of the Eclipse Public License v1.0
 * which accompanies this distribution, and is available at
 * http://www.eclipse.org/legal/epl-v10.html
 *
 * Contributors:
 *     committers of openArchitectureWare - Xpand language syntax
 *     Artem Tikhomirov (Borland) - LALR grammar
 *                                - Migration to OCL expressions
 */
package org.eclipse.gmf.internal.xpand.parser;

import java.util.LinkedList;
import java.util.List;

import lpg.runtime.LexParser;
import lpg.runtime.LexStream;
import lpg.runtime.LpgLexStream;
import lpg.runtime.Monitor;
import lpg.runtime.ParseTable;
import lpg.runtime.PrsStream;
import lpg.runtime.RuleAction;

import org.eclipse.gmf.internal.xpand.util.ParserException.ErrorLocationInfo;

public class XpandLexer extends LpgLexStream implements XpandParsersym, XpandLexersym, RuleAction {

	private static ParseTable prs = new XpandLexerprs();

	private PrsStream prsStream;

	private final LexParser lexParser = new LexParser(this, prs, this);

	private XpandKWLexer kwLexer;

	public PrsStream getPrsStream() {
		return prsStream;
	}

	public int getToken(int i) {
		return lexParser.getToken(i);
	}

	public int getRhsFirstTokenIndex(int i) {
		return lexParser.getFirstToken(i);
	}

	public int getRhsLastTokenIndex(int i) {
		return lexParser.getLastToken(i);
	}

	public int getLeftSpan() {
		return lexParser.getFirstToken();
	}

	public int getRightSpan() {
		return lexParser.getLastToken();
	}

	public XpandLexer(char[] input_chars, String filename, int tab) {
		super(input_chars, filename, tab);
	}

	public XpandLexer(char[] input_chars, String filename) {
		this(input_chars, filename, 4);
	}

	public String[] orderedExportedSymbols() {
		return XpandParsersym.orderedTerminalSymbols;
	}

	public LexStream getLexStream() {
		return (LexStream) this;
	}

	public int[] getKeywordKinds() {
		return kwLexer.getKeywordKinds();
	}

	public void lexer(PrsStream prsStream) {
		lexer(null, prsStream);
	}

	public void lexer(Monitor monitor, PrsStream prsStream) {
		if (getInputChars() == null) {
			throw new NullPointerException("LexStream was not initialized");
		}

		this.prsStream = prsStream;
		resetErrors();

		prsStream.makeToken(0, 0, 0); // Token list must start with a bad token

		lexParser.parseCharacters(monitor); // Lex the input characters

		int i = getStreamIndex();
		prsStream.makeToken(i, i, XpandParsersym.TK_EOF_TOKEN); // and end with
																// the end of
																// file token
		prsStream.setStreamLength(prsStream.getSize());

		return;
	}

	@Override
	public void initialize(char[] content, String filename) {
		super.initialize(content, filename);
		if (this.kwLexer == null) {
			this.kwLexer = new XpandKWLexer(getInputChars(), XpandParsersym.TK_IDENTIFIER);
		} else {
			this.kwLexer.setInputChars(getInputChars());
		}
	}

	final void makeToken(int kind) {
		int startOffset = getLeftSpan(), endOffset = getRightSpan();
		makeToken(startOffset, endOffset, kind);
	}

	final void makeComment(int kind) {
		int startOffset = getLeftSpan(), endOffset = getRightSpan();
		super.getPrsStream().makeAdjunct(startOffset, endOffset, kind);
	}

	final void skipToken() {
	}

	final void checkForKeyWord() {
		int startOffset = getLeftSpan(), endOffset = getRightSpan(), kwKind = kwLexer.lexer(startOffset, endOffset);
		makeToken(startOffset, endOffset, kwKind);
	}

	// aux data for getKind method
	private final int tokenKind[] = { Char_CtlCharNotWS, // 000 0x00
			Char_CtlCharNotWS, // 001 0x01
			Char_CtlCharNotWS, // 002 0x02
			Char_CtlCharNotWS, // 003 0x03
			Char_CtlCharNotWS, // 004 0x04
			Char_CtlCharNotWS, // 005 0x05
			Char_CtlCharNotWS, // 006 0x06
			Char_CtlCharNotWS, // 007 0x07
			Char_CtlCharNotWS, // 008 0x08
			Char_HT, // 009 0x09
			Char_LF, // 010 0x0A
			Char_CtlCharNotWS, // 011 0x0B
			Char_FF, // 012 0x0C
			Char_CR, // 013 0x0D
			Char_CtlCharNotWS, // 014 0x0E
			Char_CtlCharNotWS, // 015 0x0F
			Char_CtlCharNotWS, // 016 0x10
			Char_CtlCharNotWS, // 017 0x11
			Char_CtlCharNotWS, // 018 0x12
			Char_CtlCharNotWS, // 019 0x13
			Char_CtlCharNotWS, // 020 0x14
			Char_CtlCharNotWS, // 021 0x15
			Char_CtlCharNotWS, // 022 0x16
			Char_CtlCharNotWS, // 023 0x17
			Char_CtlCharNotWS, // 024 0x18
			Char_CtlCharNotWS, // 025 0x19
			Char_CtlCharNotWS, // 026 0x1A
			Char_CtlCharNotWS, // 027 0x1B
			Char_CtlCharNotWS, // 028 0x1C
			Char_CtlCharNotWS, // 029 0x1D
			Char_CtlCharNotWS, // 030 0x1E
			Char_CtlCharNotWS, // 031 0x1F
			Char_Space, // 032 0x20
			Char_Exclamation, // 033 0x21
			Char_DoubleQuote, // 034 0x22
			Char_Sharp, // 035 0x23
			Char_DollarSign, // 036 0x24
			Char_Percent, // 037 0x25
			Char_Ampersand, // 038 0x26
			Char_SingleQuote, // 039 0x27
			Char_LeftParen, // 040 0x28
			Char_RightParen, // 041 0x29
			Char_Star, // 042 0x2A
			Char_Plus, // 043 0x2B
			Char_Comma, // 044 0x2C
			Char_Minus, // 045 0x2D
			Char_Dot, // 046 0x2E
			Char_Slash, // 047 0x2F
			Char_0, // 048 0x30
			Char_1, // 049 0x31
			Char_2, // 050 0x32
			Char_3, // 051 0x33
			Char_4, // 052 0x34
			Char_5, // 053 0x35
			Char_6, // 054 0x36
			Char_7, // 055 0x37
			Char_8, // 056 0x38
			Char_9, // 057 0x39
			Char_Colon, // 058 0x3A
			Char_SemiColon, // 059 0x3B
			Char_LessThan, // 060 0x3C
			Char_Equal, // 061 0x3D
			Char_GreaterThan, // 062 0x3E
			Char_QuestionMark, // 063 0x3F
			Char_AtSign, // 064 0x40
			Char_A, // 065 0x41
			Char_B, // 066 0x42
			Char_C, // 067 0x43
			Char_D, // 068 0x44
			Char_E, // 069 0x45
			Char_F, // 070 0x46
			Char_G, // 071 0x47
			Char_H, // 072 0x48
			Char_I, // 073 0x49
			Char_J, // 074 0x4A
			Char_K, // 075 0x4B
			Char_L, // 076 0x4C
			Char_M, // 077 0x4D
			Char_N, // 078 0x4E
			Char_O, // 079 0x4F
			Char_P, // 080 0x50
			Char_Q, // 081 0x51
			Char_R, // 082 0x52
			Char_S, // 083 0x53
			Char_T, // 084 0x54
			Char_U, // 085 0x55
			Char_V, // 086 0x56
			Char_W, // 087 0x57
			Char_X, // 088 0x58
			Char_Y, // 089 0x59
			Char_Z, // 090 0x5A
			Char_LeftBracket, // 091 0x5B
			Char_BackSlash, // 092 0x5C
			Char_RightBracket, // 093 0x5D
			Char_Caret, // 094 0x5E
			Char__, // 095 0x5F
			Char_BackQuote, // 096 0x60
			Char_a, // 097 0x61
			Char_b, // 098 0x62
			Char_c, // 099 0x63
			Char_d, // 100 0x64
			Char_e, // 101 0x65
			Char_f, // 102 0x66
			Char_g, // 103 0x67
			Char_h, // 104 0x68
			Char_i, // 105 0x69
			Char_j, // 106 0x6A
			Char_k, // 107 0x6B
			Char_l, // 108 0x6C
			Char_m, // 109 0x6D
			Char_n, // 110 0x6E
			Char_o, // 111 0x6F
			Char_p, // 112 0x70
			Char_q, // 113 0x71
			Char_r, // 114 0x72
			Char_s, // 115 0x73
			Char_t, // 116 0x74
			Char_u, // 117 0x75
			Char_v, // 118 0x76
			Char_w, // 119 0x77
			Char_x, // 120 0x78
			Char_y, // 121 0x79
			Char_z, // 122 0x7A
			Char_LeftBrace, // 123 0x7B
			Char_VerticalBar, // 124 0x7C
			Char_RightBrace, // 125 0x7D
			Char_Tilde, // 126 0x7E
						// [artem] As I understand, there's no need to specify
						// characters other than those
						// we'll try to access by index from getKind method
						// (iow, this array is auxilary
						// as I indicated in its comment). Thus, there seems to
						// be no reason to specify
						// Char_Acute here as it's done in OCL's LexerBasicMap.g
			Char_AfterASCII, // for all chars in range 128..65534
			Char_EOF // for '\uffff' or 65535
	};

	// Classify character at ith location
	@Override
	public final int getKind(int i) {
		char c = (i >= getStreamLength() ? '\uffff' : getCharValue(i));
		return (c < 128 // ASCII Character
		? tokenKind[c]
				: c == '\uffff' ? Char_EOF : getNonAsciiKind(c));

	}

	private final static int getNonAsciiKind(char c) {
		if (c == '\u00AB') {
			return Char_LG;
		}
		if (c == '\u00BB') {
			return Char_RG;
		}
		if (c == '\u00b4') {
			return Char_Acute; // For OCLLexer
		}
		return Char_AfterASCII;

	}

	public ErrorLocationInfo[] getErrors() {
		return errors.toArray(new ErrorLocationInfo[errors.size()]);
	}

	private void resetErrors() {
		errors.clear();
	}

	private final List<ErrorLocationInfo> errors = new LinkedList<ErrorLocationInfo>();

	@Override
	public void reportError(int errorCode, int leftToken, int errorToken, int rightToken, String errorInfo[]) {
		StringBuilder sb = new StringBuilder("(");
		sb.append(errorCode);
		sb.append(") ");
		if (errorInfo != null) {
			for (int i = 0; i < errorInfo.length; i++) {
				if (sb.length() > 0) {
					sb.append("; ");
				}
				sb.append(errorInfo[i]);
			}
		}
		errors.add(new ErrorLocationInfo(sb.toString(), getLine(leftToken), getColumn(leftToken), getEndLine(rightToken), getEndColumn(rightToken)));
	}

	public void ruleAction(int ruleNumber) {
		switch (ruleNumber) {

		//
		// Rule 1: Token ::= Identifier
		//
		case 1: {
			checkForKeyWord();
			break;
		}

			//
			// Rule 2: Token ::= SingleQuote SLNotSQOpt SingleQuote
			//
		case 2: {
			makeToken(XpandParsersym.TK_STRING_LITERAL);
			break;
		}

			//
			// Rule 3: Token ::= Acute SLNotSQOpt Acute
			//
		case 3: {
			makeToken(XpandParsersym.TK_STRING_LITERAL);
			break;
		}

			//
			// Rule 4: Token ::= BackQuote SLNotSQOpt Acute
			//
		case 4: {
			makeToken(XpandParsersym.TK_STRING_LITERAL);
			break;
		}

			//
			// Rule 5: Token ::= IntegerLiteral
			//
		case 5:
			break;

		//
		// Rule 6: Token ::= IntegerLiteral DotToken
		//
		case 6:
			break;

		//
		// Rule 7: Token ::= IntegerLiteral DotDotToken
		//
		case 7:
			break;

		//
		// Rule 8: Token ::= RealLiteral
		//
		case 8: {
			makeToken(XpandParsersym.TK_REAL_LITERAL);
			break;
		}

			//
			// Rule 9: Token ::= SLC
			//
		case 9: {
			makeComment(XpandParsersym.TK_SINGLE_LINE_COMMENT);
			break;
		}

			//
			// Rule 10: Token ::= / * Inside Stars /
			//
		case 10: {
			makeComment(XpandParsersym.TK_MULTI_LINE_COMMENT);
			break;
		}

			//
			// Rule 11: Token ::= WS
			//
		case 11: {
			skipToken();
			break;
		}

			//
			// Rule 12: Token ::= +
			//
		case 12: {
			makeToken(XpandParsersym.TK_PLUS);
			break;
		}

			//
			// Rule 13: Token ::= -
			//
		case 13: {
			makeToken(XpandParsersym.TK_MINUS);
			break;
		}

			//
			// Rule 14: Token ::= *
			//
		case 14: {
			makeToken(XpandParsersym.TK_MULTIPLY);
			break;
		}

			//
			// Rule 15: Token ::= /
			//
		case 15: {
			makeToken(XpandParsersym.TK_DIVIDE);
			break;
		}

			//
			// Rule 16: Token ::= (
			//
		case 16: {
			makeToken(XpandParsersym.TK_LPAREN);
			break;
		}

			//
			// Rule 17: Token ::= )
			//
		case 17: {
			makeToken(XpandParsersym.TK_RPAREN);
			break;
		}

			//
			// Rule 18: Token ::= >
			//
		case 18: {
			makeToken(XpandParsersym.TK_GREATER);
			break;
		}

			//
			// Rule 19: Token ::= <
			//
		case 19: {
			makeToken(XpandParsersym.TK_LESS);
			break;
		}

			//
			// Rule 20: Token ::= =
			//
		case 20: {
			makeToken(XpandParsersym.TK_EQUAL);
			break;
		}

			//
			// Rule 21: Token ::= > =
			//
		case 21: {
			makeToken(XpandParsersym.TK_GREATER_EQUAL);
			break;
		}

			//
			// Rule 22: Token ::= < =
			//
		case 22: {
			makeToken(XpandParsersym.TK_LESS_EQUAL);
			break;
		}

			//
			// Rule 23: Token ::= < >
			//
		case 23: {
			makeToken(XpandParsersym.TK_NOT_EQUAL);
			break;
		}

			//
			// Rule 24: Token ::= [
			//
		case 24: {
			makeToken(XpandParsersym.TK_LBRACKET);
			break;
		}

			//
			// Rule 25: Token ::= ]
			//
		case 25: {
			makeToken(XpandParsersym.TK_RBRACKET);
			break;
		}

			//
			// Rule 26: Token ::= {
			//
		case 26: {
			makeToken(XpandParsersym.TK_LBRACE);
			break;
		}

			//
			// Rule 27: Token ::= }
			//
		case 27: {
			makeToken(XpandParsersym.TK_RBRACE);
			break;
		}

			//
			// Rule 28: Token ::= - >
			//
		case 28: {
			makeToken(XpandParsersym.TK_ARROW);
			break;
		}

			//
			// Rule 29: Token ::= |
			//
		case 29: {
			makeToken(XpandParsersym.TK_BAR);
			break;
		}

			//
			// Rule 30: Token ::= ,
			//
		case 30: {
			makeToken(XpandParsersym.TK_COMMA);
			break;
		}

			//
			// Rule 31: Token ::= :
			//
		case 31: {
			makeToken(XpandParsersym.TK_COLON);
			break;
		}

			//
			// Rule 32: Token ::= : :
			//
		case 32: {
			makeToken(XpandParsersym.TK_COLONCOLON);
			break;
		}

			//
			// Rule 33: Token ::= ;
			//
		case 33: {
			makeToken(XpandParsersym.TK_SEMICOLON);
			break;
		}

			//
			// Rule 34: Token ::= DotToken
			//
		case 34:
			break;

		//
		// Rule 35: DotToken ::= .
		//
		case 35: {
			makeToken(XpandParsersym.TK_DOT);
			break;
		}

			//
			// Rule 36: Token ::= DotDotToken
			//
		case 36:
			break;

		//
		// Rule 37: DotDotToken ::= . .
		//
		case 37: {
			makeToken(XpandParsersym.TK_DOTDOT);
			break;
		}

			//
			// Rule 38: IntegerLiteral ::= Integer
			//
		case 38: {
			makeToken(XpandParsersym.TK_INTEGER_LITERAL);
			break;
		}

			//
			// Rule 263: Token ::= : =
			//
		case 263: {
			makeToken(XpandParsersym.TK_RESET_ASSIGN);
			break;
		}

			//
			// Rule 264: Token ::= + =
			//
		case 264: {
			makeToken(XpandParsersym.TK_ADD_ASSIGN);
			break;
		}

			//
			// Rule 265: Token ::= !
			//
		case 265: {
			makeToken(XpandParsersym.TK_EXCLAMATION_MARK);
			break;
		}

			//
			// Rule 266: Token ::= : : =
			//
		case 266: {
			makeToken(XpandParsersym.TK_COLONCOLONEQUAL);
			break;
		}

			//
			// Rule 267: Token ::= ?
			//
		case 267: {
			makeToken(XpandParsersym.TK_QUESTIONMARK);
			break;
		}

			//
			// Rule 274: Token ::= DoubleQuote SLNotDQOpt DoubleQuote
			//
		case 274: {
			makeToken(XpandParsersym.TK_STRING_LITERAL);
			break;
		}

			//
			// Rule 278: Token ::= < <
			//
		case 278: {
			makeToken(XpandParsersym.TK_STEREOTYPE_QUALIFIER_OPEN);
			break;
		}

			//
			// Rule 279: Token ::= > >
			//
		case 279: {
			makeToken(XpandParsersym.TK_STEREOTYPE_QUALIFIER_CLOSE);
			break;
		}

			//
			// Rule 280: Token ::= . . .
			//
		case 280: {
			makeToken(XpandParsersym.TK_MULTIPLICITY_RANGE);
			break;
		}

			//
			// Rule 281: Token ::= ~
			//
		case 281: {
			makeToken(XpandParsersym.TK_TILDE_SIGN);
			break;
		}

			//
			// Rule 282: Token ::= ! =
			//
		case 282: {
			makeToken(XpandParsersym.TK_NOT_EQUAL_EXEQ);
			break;
		}

			//
			// Rule 283: Token ::= @
			//
		case 283: {
			makeToken(XpandParsersym.TK_AT_SIGN);
			break;
		}

			//
			// Rule 284: Token ::= LG
			//
		case 284: {
			makeToken(XpandParsersym.TK_LG);
			break;
		}
			//
			// Rule 285: Token ::= RG textAny lgOpt
			//
		case 285: {
			makeToken(XpandParsersym.TK_TEXT);
			break;
		}
			//
			// Rule 295: Token ::= R E M RG commentAny lgPlus E N D R E M
			//
		case 295: {
			skipToken();
			break;
		}

		default:
			break;
		}
		return;
	}
}