/* * Copyright (c) 2006, 2009 Borland Software Corporation and others. * All rights reserved. This program and the accompanying materials * are made available under the terms of the Eclipse Public License v1.0 * which accompanies this distribution, and is available at * http://www.eclipse.org/legal/epl-v10.html * * Contributors: * committers of openArchitectureWare - Xpand language syntax * Artem Tikhomirov (Borland) - LALR grammar * - Migration to OCL expressions */ package org.eclipse.gmf.internal.xpand.parser; import java.util.LinkedList; import java.util.List; import lpg.runtime.LexParser; import lpg.runtime.LexStream; import lpg.runtime.LpgLexStream; import lpg.runtime.Monitor; import lpg.runtime.ParseTable; import lpg.runtime.PrsStream; import lpg.runtime.RuleAction; import org.eclipse.gmf.internal.xpand.util.ParserException.ErrorLocationInfo; public class XpandLexer extends LpgLexStream implements XpandParsersym, XpandLexersym, RuleAction { private static ParseTable prs = new XpandLexerprs(); private PrsStream prsStream; private final LexParser lexParser = new LexParser(this, prs, this); private XpandKWLexer kwLexer; public PrsStream getPrsStream() { return prsStream; } public int getToken(int i) { return lexParser.getToken(i); } public int getRhsFirstTokenIndex(int i) { return lexParser.getFirstToken(i); } public int getRhsLastTokenIndex(int i) { return lexParser.getLastToken(i); } public int getLeftSpan() { return lexParser.getFirstToken(); } public int getRightSpan() { return lexParser.getLastToken(); } public XpandLexer(char[] input_chars, String filename, int tab) { super(input_chars, filename, tab); } public XpandLexer(char[] input_chars, String filename) { this(input_chars, filename, 4); } public String[] orderedExportedSymbols() { return XpandParsersym.orderedTerminalSymbols; } public LexStream getLexStream() { return (LexStream) this; } public int[] getKeywordKinds() { return kwLexer.getKeywordKinds(); } public void lexer(PrsStream prsStream) { lexer(null, prsStream); } public void lexer(Monitor monitor, PrsStream prsStream) { if (getInputChars() == null) { throw new NullPointerException("LexStream was not initialized"); } this.prsStream = prsStream; resetErrors(); prsStream.makeToken(0, 0, 0); // Token list must start with a bad token lexParser.parseCharacters(monitor); // Lex the input characters int i = getStreamIndex(); prsStream.makeToken(i, i, XpandParsersym.TK_EOF_TOKEN); // and end with // the end of // file token prsStream.setStreamLength(prsStream.getSize()); return; } @Override public void initialize(char[] content, String filename) { super.initialize(content, filename); if (this.kwLexer == null) { this.kwLexer = new XpandKWLexer(getInputChars(), XpandParsersym.TK_IDENTIFIER); } else { this.kwLexer.setInputChars(getInputChars()); } } final void makeToken(int kind) { int startOffset = getLeftSpan(), endOffset = getRightSpan(); makeToken(startOffset, endOffset, kind); } final void makeComment(int kind) { int startOffset = getLeftSpan(), endOffset = getRightSpan(); super.getPrsStream().makeAdjunct(startOffset, endOffset, kind); } final void skipToken() { } final void checkForKeyWord() { int startOffset = getLeftSpan(), endOffset = getRightSpan(), kwKind = kwLexer.lexer(startOffset, endOffset); makeToken(startOffset, endOffset, kwKind); } // aux data for getKind method private final int tokenKind[] = { Char_CtlCharNotWS, // 000 0x00 Char_CtlCharNotWS, // 001 0x01 Char_CtlCharNotWS, // 002 0x02 Char_CtlCharNotWS, // 003 0x03 Char_CtlCharNotWS, // 004 0x04 Char_CtlCharNotWS, // 005 0x05 Char_CtlCharNotWS, // 006 0x06 Char_CtlCharNotWS, // 007 0x07 Char_CtlCharNotWS, // 008 0x08 Char_HT, // 009 0x09 Char_LF, // 010 0x0A Char_CtlCharNotWS, // 011 0x0B Char_FF, // 012 0x0C Char_CR, // 013 0x0D Char_CtlCharNotWS, // 014 0x0E Char_CtlCharNotWS, // 015 0x0F Char_CtlCharNotWS, // 016 0x10 Char_CtlCharNotWS, // 017 0x11 Char_CtlCharNotWS, // 018 0x12 Char_CtlCharNotWS, // 019 0x13 Char_CtlCharNotWS, // 020 0x14 Char_CtlCharNotWS, // 021 0x15 Char_CtlCharNotWS, // 022 0x16 Char_CtlCharNotWS, // 023 0x17 Char_CtlCharNotWS, // 024 0x18 Char_CtlCharNotWS, // 025 0x19 Char_CtlCharNotWS, // 026 0x1A Char_CtlCharNotWS, // 027 0x1B Char_CtlCharNotWS, // 028 0x1C Char_CtlCharNotWS, // 029 0x1D Char_CtlCharNotWS, // 030 0x1E Char_CtlCharNotWS, // 031 0x1F Char_Space, // 032 0x20 Char_Exclamation, // 033 0x21 Char_DoubleQuote, // 034 0x22 Char_Sharp, // 035 0x23 Char_DollarSign, // 036 0x24 Char_Percent, // 037 0x25 Char_Ampersand, // 038 0x26 Char_SingleQuote, // 039 0x27 Char_LeftParen, // 040 0x28 Char_RightParen, // 041 0x29 Char_Star, // 042 0x2A Char_Plus, // 043 0x2B Char_Comma, // 044 0x2C Char_Minus, // 045 0x2D Char_Dot, // 046 0x2E Char_Slash, // 047 0x2F Char_0, // 048 0x30 Char_1, // 049 0x31 Char_2, // 050 0x32 Char_3, // 051 0x33 Char_4, // 052 0x34 Char_5, // 053 0x35 Char_6, // 054 0x36 Char_7, // 055 0x37 Char_8, // 056 0x38 Char_9, // 057 0x39 Char_Colon, // 058 0x3A Char_SemiColon, // 059 0x3B Char_LessThan, // 060 0x3C Char_Equal, // 061 0x3D Char_GreaterThan, // 062 0x3E Char_QuestionMark, // 063 0x3F Char_AtSign, // 064 0x40 Char_A, // 065 0x41 Char_B, // 066 0x42 Char_C, // 067 0x43 Char_D, // 068 0x44 Char_E, // 069 0x45 Char_F, // 070 0x46 Char_G, // 071 0x47 Char_H, // 072 0x48 Char_I, // 073 0x49 Char_J, // 074 0x4A Char_K, // 075 0x4B Char_L, // 076 0x4C Char_M, // 077 0x4D Char_N, // 078 0x4E Char_O, // 079 0x4F Char_P, // 080 0x50 Char_Q, // 081 0x51 Char_R, // 082 0x52 Char_S, // 083 0x53 Char_T, // 084 0x54 Char_U, // 085 0x55 Char_V, // 086 0x56 Char_W, // 087 0x57 Char_X, // 088 0x58 Char_Y, // 089 0x59 Char_Z, // 090 0x5A Char_LeftBracket, // 091 0x5B Char_BackSlash, // 092 0x5C Char_RightBracket, // 093 0x5D Char_Caret, // 094 0x5E Char__, // 095 0x5F Char_BackQuote, // 096 0x60 Char_a, // 097 0x61 Char_b, // 098 0x62 Char_c, // 099 0x63 Char_d, // 100 0x64 Char_e, // 101 0x65 Char_f, // 102 0x66 Char_g, // 103 0x67 Char_h, // 104 0x68 Char_i, // 105 0x69 Char_j, // 106 0x6A Char_k, // 107 0x6B Char_l, // 108 0x6C Char_m, // 109 0x6D Char_n, // 110 0x6E Char_o, // 111 0x6F Char_p, // 112 0x70 Char_q, // 113 0x71 Char_r, // 114 0x72 Char_s, // 115 0x73 Char_t, // 116 0x74 Char_u, // 117 0x75 Char_v, // 118 0x76 Char_w, // 119 0x77 Char_x, // 120 0x78 Char_y, // 121 0x79 Char_z, // 122 0x7A Char_LeftBrace, // 123 0x7B Char_VerticalBar, // 124 0x7C Char_RightBrace, // 125 0x7D Char_Tilde, // 126 0x7E // [artem] As I understand, there's no need to specify // characters other than those // we'll try to access by index from getKind method // (iow, this array is auxilary // as I indicated in its comment). Thus, there seems to // be no reason to specify // Char_Acute here as it's done in OCL's LexerBasicMap.g Char_AfterASCII, // for all chars in range 128..65534 Char_EOF // for '\uffff' or 65535 }; // Classify character at ith location @Override public final int getKind(int i) { char c = (i >= getStreamLength() ? '\uffff' : getCharValue(i)); return (c < 128 // ASCII Character ? tokenKind[c] : c == '\uffff' ? Char_EOF : getNonAsciiKind(c)); } private final static int getNonAsciiKind(char c) { if (c == '\u00AB') { return Char_LG; } if (c == '\u00BB') { return Char_RG; } if (c == '\u00b4') { return Char_Acute; // For OCLLexer } return Char_AfterASCII; } public ErrorLocationInfo[] getErrors() { return errors.toArray(new ErrorLocationInfo[errors.size()]); } private void resetErrors() { errors.clear(); } private final List<ErrorLocationInfo> errors = new LinkedList<ErrorLocationInfo>(); @Override public void reportError(int errorCode, int leftToken, int errorToken, int rightToken, String errorInfo[]) { StringBuilder sb = new StringBuilder("("); sb.append(errorCode); sb.append(") "); if (errorInfo != null) { for (int i = 0; i < errorInfo.length; i++) { if (sb.length() > 0) { sb.append("; "); } sb.append(errorInfo[i]); } } errors.add(new ErrorLocationInfo(sb.toString(), getLine(leftToken), getColumn(leftToken), getEndLine(rightToken), getEndColumn(rightToken))); } public void ruleAction(int ruleNumber) { switch (ruleNumber) { // // Rule 1: Token ::= Identifier // case 1: { checkForKeyWord(); break; } // // Rule 2: Token ::= SingleQuote SLNotSQOpt SingleQuote // case 2: { makeToken(XpandParsersym.TK_STRING_LITERAL); break; } // // Rule 3: Token ::= Acute SLNotSQOpt Acute // case 3: { makeToken(XpandParsersym.TK_STRING_LITERAL); break; } // // Rule 4: Token ::= BackQuote SLNotSQOpt Acute // case 4: { makeToken(XpandParsersym.TK_STRING_LITERAL); break; } // // Rule 5: Token ::= IntegerLiteral // case 5: break; // // Rule 6: Token ::= IntegerLiteral DotToken // case 6: break; // // Rule 7: Token ::= IntegerLiteral DotDotToken // case 7: break; // // Rule 8: Token ::= RealLiteral // case 8: { makeToken(XpandParsersym.TK_REAL_LITERAL); break; } // // Rule 9: Token ::= SLC // case 9: { makeComment(XpandParsersym.TK_SINGLE_LINE_COMMENT); break; } // // Rule 10: Token ::= / * Inside Stars / // case 10: { makeComment(XpandParsersym.TK_MULTI_LINE_COMMENT); break; } // // Rule 11: Token ::= WS // case 11: { skipToken(); break; } // // Rule 12: Token ::= + // case 12: { makeToken(XpandParsersym.TK_PLUS); break; } // // Rule 13: Token ::= - // case 13: { makeToken(XpandParsersym.TK_MINUS); break; } // // Rule 14: Token ::= * // case 14: { makeToken(XpandParsersym.TK_MULTIPLY); break; } // // Rule 15: Token ::= / // case 15: { makeToken(XpandParsersym.TK_DIVIDE); break; } // // Rule 16: Token ::= ( // case 16: { makeToken(XpandParsersym.TK_LPAREN); break; } // // Rule 17: Token ::= ) // case 17: { makeToken(XpandParsersym.TK_RPAREN); break; } // // Rule 18: Token ::= > // case 18: { makeToken(XpandParsersym.TK_GREATER); break; } // // Rule 19: Token ::= < // case 19: { makeToken(XpandParsersym.TK_LESS); break; } // // Rule 20: Token ::= = // case 20: { makeToken(XpandParsersym.TK_EQUAL); break; } // // Rule 21: Token ::= > = // case 21: { makeToken(XpandParsersym.TK_GREATER_EQUAL); break; } // // Rule 22: Token ::= < = // case 22: { makeToken(XpandParsersym.TK_LESS_EQUAL); break; } // // Rule 23: Token ::= < > // case 23: { makeToken(XpandParsersym.TK_NOT_EQUAL); break; } // // Rule 24: Token ::= [ // case 24: { makeToken(XpandParsersym.TK_LBRACKET); break; } // // Rule 25: Token ::= ] // case 25: { makeToken(XpandParsersym.TK_RBRACKET); break; } // // Rule 26: Token ::= { // case 26: { makeToken(XpandParsersym.TK_LBRACE); break; } // // Rule 27: Token ::= } // case 27: { makeToken(XpandParsersym.TK_RBRACE); break; } // // Rule 28: Token ::= - > // case 28: { makeToken(XpandParsersym.TK_ARROW); break; } // // Rule 29: Token ::= | // case 29: { makeToken(XpandParsersym.TK_BAR); break; } // // Rule 30: Token ::= , // case 30: { makeToken(XpandParsersym.TK_COMMA); break; } // // Rule 31: Token ::= : // case 31: { makeToken(XpandParsersym.TK_COLON); break; } // // Rule 32: Token ::= : : // case 32: { makeToken(XpandParsersym.TK_COLONCOLON); break; } // // Rule 33: Token ::= ; // case 33: { makeToken(XpandParsersym.TK_SEMICOLON); break; } // // Rule 34: Token ::= DotToken // case 34: break; // // Rule 35: DotToken ::= . // case 35: { makeToken(XpandParsersym.TK_DOT); break; } // // Rule 36: Token ::= DotDotToken // case 36: break; // // Rule 37: DotDotToken ::= . . // case 37: { makeToken(XpandParsersym.TK_DOTDOT); break; } // // Rule 38: IntegerLiteral ::= Integer // case 38: { makeToken(XpandParsersym.TK_INTEGER_LITERAL); break; } // // Rule 263: Token ::= : = // case 263: { makeToken(XpandParsersym.TK_RESET_ASSIGN); break; } // // Rule 264: Token ::= + = // case 264: { makeToken(XpandParsersym.TK_ADD_ASSIGN); break; } // // Rule 265: Token ::= ! // case 265: { makeToken(XpandParsersym.TK_EXCLAMATION_MARK); break; } // // Rule 266: Token ::= : : = // case 266: { makeToken(XpandParsersym.TK_COLONCOLONEQUAL); break; } // // Rule 267: Token ::= ? // case 267: { makeToken(XpandParsersym.TK_QUESTIONMARK); break; } // // Rule 274: Token ::= DoubleQuote SLNotDQOpt DoubleQuote // case 274: { makeToken(XpandParsersym.TK_STRING_LITERAL); break; } // // Rule 278: Token ::= < < // case 278: { makeToken(XpandParsersym.TK_STEREOTYPE_QUALIFIER_OPEN); break; } // // Rule 279: Token ::= > > // case 279: { makeToken(XpandParsersym.TK_STEREOTYPE_QUALIFIER_CLOSE); break; } // // Rule 280: Token ::= . . . // case 280: { makeToken(XpandParsersym.TK_MULTIPLICITY_RANGE); break; } // // Rule 281: Token ::= ~ // case 281: { makeToken(XpandParsersym.TK_TILDE_SIGN); break; } // // Rule 282: Token ::= ! = // case 282: { makeToken(XpandParsersym.TK_NOT_EQUAL_EXEQ); break; } // // Rule 283: Token ::= @ // case 283: { makeToken(XpandParsersym.TK_AT_SIGN); break; } // // Rule 284: Token ::= LG // case 284: { makeToken(XpandParsersym.TK_LG); break; } // // Rule 285: Token ::= RG textAny lgOpt // case 285: { makeToken(XpandParsersym.TK_TEXT); break; } // // Rule 295: Token ::= R E M RG commentAny lgPlus E N D R E M // case 295: { skipToken(); break; } default: break; } return; } }