| /* |
| * Copyright (c) 2006, 2009 Borland Software Corporation and others. |
| * All rights reserved. This program and the accompanying materials |
| * are made available under the terms of the Eclipse Public License v1.0 |
| * which accompanies this distribution, and is available at |
| * http://www.eclipse.org/legal/epl-v10.html |
| * |
| * Contributors: |
| * committers of openArchitectureWare - Xpand language syntax |
| * Artem Tikhomirov (Borland) - LALR grammar |
| * - Migration to OCL expressions |
| */ |
| package org.eclipse.gmf.internal.xpand.parser; |
| |
| import java.util.LinkedList; |
| import java.util.List; |
| import java.util.regex.Matcher; |
| import java.util.regex.Pattern; |
| |
| import lpg.lpgjavaruntime.LexParser; |
| import lpg.lpgjavaruntime.LexStream; |
| import lpg.lpgjavaruntime.LpgLexStream; |
| import lpg.lpgjavaruntime.Monitor; |
| import lpg.lpgjavaruntime.ParseTable; |
| import lpg.lpgjavaruntime.PrsStream; |
| import lpg.lpgjavaruntime.RuleAction; |
| |
| import org.eclipse.gmf.internal.xpand.Activator; |
| import org.eclipse.gmf.internal.xpand.util.ParserException.ErrorLocationInfo; |
| |
| public class XpandLexer extends LpgLexStream implements XpandParsersym, XpandLexersym, RuleAction { |
| |
| private static ParseTable prs = new XpandLexerprs(); |
| |
| private PrsStream prsStream; |
| |
| private final LexParser lexParser = new LexParser(this, prs, this); |
| |
| private XpandKWLexer kwLexer; |
| |
| public PrsStream getPrsStream() { |
| return prsStream; |
| } |
| |
| public int getToken(int i) { |
| return lexParser.getToken(i); |
| } |
| |
| public int getRhsFirstTokenIndex(int i) { |
| return lexParser.getFirstToken(i); |
| } |
| |
| public int getRhsLastTokenIndex(int i) { |
| return lexParser.getLastToken(i); |
| } |
| |
| public int getLeftSpan() { |
| return lexParser.getFirstToken(); |
| } |
| |
| public int getRightSpan() { |
| return lexParser.getLastToken(); |
| } |
| |
| public XpandLexer(char[] input_chars, String filename, int tab) { |
| super(input_chars, filename, tab); |
| } |
| |
| public XpandLexer(char[] input_chars, String filename) { |
| this(input_chars, filename, 4); |
| } |
| |
| public String[] orderedExportedSymbols() { |
| return XpandParsersym.orderedTerminalSymbols; |
| } |
| |
| public LexStream getLexStream() { |
| return (LexStream) this; |
| } |
| |
| public int[] getKeywordKinds() { |
| return kwLexer.getKeywordKinds(); |
| } |
| |
| public void lexer(PrsStream prsStream) { |
| lexer(null, prsStream); |
| } |
| |
| public void lexer(Monitor monitor, PrsStream prsStream) { |
| if (getInputChars() == null) { |
| throw new NullPointerException("LexStream was not initialized"); |
| } |
| |
| this.prsStream = prsStream; |
| resetErrors(); |
| |
| prsStream.makeToken(0, 0, 0); // Token list must start with a bad token |
| |
| lexParser.parseCharacters(monitor); // Lex the input characters |
| |
| int i = getStreamIndex(); |
| prsStream.makeToken(i, i, TK_EOF_TOKEN); // and end with the end of file |
| // token |
| prsStream.setStreamLength(prsStream.getSize()); |
| |
| return; |
| } |
| |
| @Override |
| public void initialize(char[] content, String filename) { |
| super.initialize(content, filename); |
| if (this.kwLexer == null) { |
| this.kwLexer = new XpandKWLexer(getInputChars(), TK_IDENTIFIER); |
| } else { |
| this.kwLexer.setInputChars(getInputChars()); |
| } |
| } |
| |
| final void makeToken(int kind) { |
| int startOffset = getLeftSpan(), endOffset = getRightSpan(); |
| makeToken(startOffset, endOffset, kind); |
| } |
| |
| final void makeComment(int kind) { |
| int startOffset = getLeftSpan(), endOffset = getRightSpan(); |
| super.getPrsStream().makeAdjunct(startOffset, endOffset, kind); |
| } |
| |
| final void skipToken() { |
| } |
| |
| final void checkForKeyWord() { |
| int startOffset = getLeftSpan(), endOffset = getRightSpan(), kwKind = kwLexer.lexer(startOffset, endOffset); |
| makeToken(startOffset, endOffset, kwKind); |
| } |
| |
| // aux data for getKind method |
| private final int tokenKind[] = { Char_CtlCharNotWS, // 000 0x00 |
| Char_CtlCharNotWS, // 001 0x01 |
| Char_CtlCharNotWS, // 002 0x02 |
| Char_CtlCharNotWS, // 003 0x03 |
| Char_CtlCharNotWS, // 004 0x04 |
| Char_CtlCharNotWS, // 005 0x05 |
| Char_CtlCharNotWS, // 006 0x06 |
| Char_CtlCharNotWS, // 007 0x07 |
| Char_CtlCharNotWS, // 008 0x08 |
| Char_HT, // 009 0x09 |
| Char_LF, // 010 0x0A |
| Char_CtlCharNotWS, // 011 0x0B |
| Char_FF, // 012 0x0C |
| Char_CR, // 013 0x0D |
| Char_CtlCharNotWS, // 014 0x0E |
| Char_CtlCharNotWS, // 015 0x0F |
| Char_CtlCharNotWS, // 016 0x10 |
| Char_CtlCharNotWS, // 017 0x11 |
| Char_CtlCharNotWS, // 018 0x12 |
| Char_CtlCharNotWS, // 019 0x13 |
| Char_CtlCharNotWS, // 020 0x14 |
| Char_CtlCharNotWS, // 021 0x15 |
| Char_CtlCharNotWS, // 022 0x16 |
| Char_CtlCharNotWS, // 023 0x17 |
| Char_CtlCharNotWS, // 024 0x18 |
| Char_CtlCharNotWS, // 025 0x19 |
| Char_CtlCharNotWS, // 026 0x1A |
| Char_CtlCharNotWS, // 027 0x1B |
| Char_CtlCharNotWS, // 028 0x1C |
| Char_CtlCharNotWS, // 029 0x1D |
| Char_CtlCharNotWS, // 030 0x1E |
| Char_CtlCharNotWS, // 031 0x1F |
| Char_Space, // 032 0x20 |
| Char_Exclamation, // 033 0x21 |
| Char_DoubleQuote, // 034 0x22 |
| Char_Sharp, // 035 0x23 |
| Char_DollarSign, // 036 0x24 |
| Char_Percent, // 037 0x25 |
| Char_Ampersand, // 038 0x26 |
| Char_SingleQuote, // 039 0x27 |
| Char_LeftParen, // 040 0x28 |
| Char_RightParen, // 041 0x29 |
| Char_Star, // 042 0x2A |
| Char_Plus, // 043 0x2B |
| Char_Comma, // 044 0x2C |
| Char_Minus, // 045 0x2D |
| Char_Dot, // 046 0x2E |
| Char_Slash, // 047 0x2F |
| Char_0, // 048 0x30 |
| Char_1, // 049 0x31 |
| Char_2, // 050 0x32 |
| Char_3, // 051 0x33 |
| Char_4, // 052 0x34 |
| Char_5, // 053 0x35 |
| Char_6, // 054 0x36 |
| Char_7, // 055 0x37 |
| Char_8, // 056 0x38 |
| Char_9, // 057 0x39 |
| Char_Colon, // 058 0x3A |
| Char_SemiColon, // 059 0x3B |
| Char_LessThan, // 060 0x3C |
| Char_Equal, // 061 0x3D |
| Char_GreaterThan, // 062 0x3E |
| Char_QuestionMark, // 063 0x3F |
| Char_AtSign, // 064 0x40 |
| Char_A, // 065 0x41 |
| Char_B, // 066 0x42 |
| Char_C, // 067 0x43 |
| Char_D, // 068 0x44 |
| Char_E, // 069 0x45 |
| Char_F, // 070 0x46 |
| Char_G, // 071 0x47 |
| Char_H, // 072 0x48 |
| Char_I, // 073 0x49 |
| Char_J, // 074 0x4A |
| Char_K, // 075 0x4B |
| Char_L, // 076 0x4C |
| Char_M, // 077 0x4D |
| Char_N, // 078 0x4E |
| Char_O, // 079 0x4F |
| Char_P, // 080 0x50 |
| Char_Q, // 081 0x51 |
| Char_R, // 082 0x52 |
| Char_S, // 083 0x53 |
| Char_T, // 084 0x54 |
| Char_U, // 085 0x55 |
| Char_V, // 086 0x56 |
| Char_W, // 087 0x57 |
| Char_X, // 088 0x58 |
| Char_Y, // 089 0x59 |
| Char_Z, // 090 0x5A |
| Char_LeftBracket, // 091 0x5B |
| Char_BackSlash, // 092 0x5C |
| Char_RightBracket, // 093 0x5D |
| Char_Caret, // 094 0x5E |
| Char__, // 095 0x5F |
| Char_BackQuote, // 096 0x60 |
| Char_a, // 097 0x61 |
| Char_b, // 098 0x62 |
| Char_c, // 099 0x63 |
| Char_d, // 100 0x64 |
| Char_e, // 101 0x65 |
| Char_f, // 102 0x66 |
| Char_g, // 103 0x67 |
| Char_h, // 104 0x68 |
| Char_i, // 105 0x69 |
| Char_j, // 106 0x6A |
| Char_k, // 107 0x6B |
| Char_l, // 108 0x6C |
| Char_m, // 109 0x6D |
| Char_n, // 110 0x6E |
| Char_o, // 111 0x6F |
| Char_p, // 112 0x70 |
| Char_q, // 113 0x71 |
| Char_r, // 114 0x72 |
| Char_s, // 115 0x73 |
| Char_t, // 116 0x74 |
| Char_u, // 117 0x75 |
| Char_v, // 118 0x76 |
| Char_w, // 119 0x77 |
| Char_x, // 120 0x78 |
| Char_y, // 121 0x79 |
| Char_z, // 122 0x7A |
| Char_LeftBrace, // 123 0x7B |
| Char_VerticalBar, // 124 0x7C |
| Char_RightBrace, // 125 0x7D |
| Char_Tilde, // 126 0x7E |
| // [artem] As I understand, there's no need to specify characters |
| // other than those |
| // we'll try to access by index from getKind method (iow, this array |
| // is auxilary |
| // as I indicated in its comment). Thus, there seems to be no reason |
| // to specify |
| // Char_Acute here as it's done in OCL's LexerBasicMap.g |
| Char_AfterASCII, // for all chars in range 128..65534 |
| Char_EOF // for '\uffff' or 65535 |
| }; |
| |
| // Classify character at ith location |
| @Override |
| public final int getKind(int i) { |
| char c = (i >= getStreamLength() ? '\uffff' : getCharValue(i)); |
| return (c < 128 // ASCII Character |
| ? tokenKind[c] |
| : c == '\uffff' ? Char_EOF : getNonAsciiKind(c)); |
| |
| } |
| |
| private final static int getNonAsciiKind(char c) { |
| if (c == '\u00AB') { |
| return Char_LG; |
| } |
| if (c == '\u00BB') { |
| return Char_RG; |
| } |
| if (c == '\u00b4') { |
| return Char_Acute; // For OCLLexer |
| } |
| return Char_AfterASCII; |
| |
| } |
| |
| public ErrorLocationInfo[] getErrors() { |
| return errors.toArray(new ErrorLocationInfo[errors.size()]); |
| } |
| |
| private void resetErrors() { |
| errors.clear(); |
| } |
| |
| private final List<ErrorLocationInfo> errors = new LinkedList<ErrorLocationInfo>(); |
| |
| @Override |
| public void reportError(int i, String code) { |
| Activator.logWarn("Unexpected #reportError(int,String)"); |
| reportError(i, i); |
| } |
| |
| @Override |
| public void reportError(int leftToken, int rightToken) { |
| final int errorCode = (rightToken >= getStreamLength() ? EOF_CODE : leftToken == rightToken ? LEX_ERROR_CODE : INVALID_TOKEN_CODE); |
| final int endToken = (leftToken == rightToken ? rightToken : rightToken - 1); |
| reportError(errorCode, null, leftToken, endToken, getName(leftToken)); |
| } |
| |
| @Override |
| public void reportError(int errorCode, String locationInfo, String tokenText) { |
| try { |
| Matcher m = Pattern.compile("(?:[^:]+::)*[^:]+:(\\d+):(\\d+):(\\d+):(\\d+):.*").matcher(locationInfo); |
| boolean t = m.matches(); // ignore return value, rely on exception |
| // if anything wrong |
| assert t; |
| final int leftTokenLine = Integer.parseInt(m.group(1)); |
| final int leftTokenColumn = Integer.parseInt(m.group(2)); |
| final int rightTokenLine = Integer.parseInt(m.group(3)); |
| final int rightTokenColumn = Integer.parseInt(m.group(4)); |
| final String msg = tokenText + errorMsgText[errorCode]; |
| errors.add(new ErrorLocationInfo(msg, leftTokenLine, leftTokenColumn, rightTokenLine, rightTokenColumn)); |
| } catch (Throwable ex) { |
| // ignore |
| errors.add(new ErrorLocationInfo(tokenText + errorMsgText[errorCode])); |
| } |
| } |
| |
| @Override |
| public void reportError(int errorCode, String locationInfo, int leftToken, int rightToken, String tokenText) { |
| final int leftTokenLine = getLine(leftToken); |
| final int leftTokenColumn = getColumn(leftToken); |
| final int rightTokenLine = getEndLine(rightToken); |
| final int rightTokenColumn = getEndColumn(rightToken); |
| final String msg = tokenText + errorMsgText[errorCode] + (locationInfo != null && locationInfo.length() > 0 ? '(' + locationInfo + ')' : ""); |
| final int startOffset = leftToken; |
| final int endOffset = rightToken; |
| errors.add(new ErrorLocationInfo(msg, leftTokenLine, leftTokenColumn, rightTokenLine, rightTokenColumn, startOffset, endOffset)); |
| } |
| |
| /* |
| |
| */ |
| |
| public void ruleAction(int ruleNumber) { |
| switch (ruleNumber) { |
| |
| // |
| // Rule 1: Token ::= Identifier |
| // |
| case 1: { |
| checkForKeyWord(); |
| break; |
| } |
| |
| // |
| // Rule 2: Token ::= EscapedSQ |
| // |
| case 2: { |
| makeToken(TK_STRING_LITERAL); |
| break; |
| } |
| |
| // |
| // Rule 3: Token ::= SingleQuote SLNotSQ SingleQuote |
| // |
| case 3: { |
| makeToken(TK_STRING_LITERAL); |
| break; |
| } |
| |
| // |
| // Rule 4: Token ::= Acute SLNotSQOpt Acute |
| // |
| case 4: { |
| makeToken(TK_STRING_LITERAL); |
| break; |
| } |
| |
| // |
| // Rule 5: Token ::= BackQuote SLNotSQOpt Acute |
| // |
| case 5: { |
| makeToken(TK_STRING_LITERAL); |
| break; |
| } |
| |
| // |
| // Rule 6: Token ::= IntegerLiteral |
| // |
| case 6: |
| break; |
| |
| // |
| // Rule 7: Token ::= IntegerLiteral DotToken |
| // |
| case 7: |
| break; |
| |
| // |
| // Rule 8: Token ::= IntegerLiteral DotDotToken |
| // |
| case 8: |
| break; |
| |
| // |
| // Rule 9: Token ::= RealLiteral |
| // |
| case 9: { |
| makeToken(TK_REAL_LITERAL); |
| break; |
| } |
| |
| // |
| // Rule 10: Token ::= SLC |
| // |
| case 10: { |
| makeComment(TK_SINGLE_LINE_COMMENT); |
| break; |
| } |
| |
| // |
| // Rule 11: Token ::= / * Inside Stars / |
| // |
| case 11: { |
| makeComment(TK_MULTI_LINE_COMMENT); |
| break; |
| } |
| |
| // |
| // Rule 12: Token ::= WS |
| // |
| case 12: { |
| skipToken(); |
| break; |
| } |
| |
| // |
| // Rule 13: Token ::= + |
| // |
| case 13: { |
| makeToken(TK_PLUS); |
| break; |
| } |
| |
| // |
| // Rule 14: Token ::= - |
| // |
| case 14: { |
| makeToken(TK_MINUS); |
| break; |
| } |
| |
| // |
| // Rule 15: Token ::= * |
| // |
| case 15: { |
| makeToken(TK_MULTIPLY); |
| break; |
| } |
| |
| // |
| // Rule 16: Token ::= / |
| // |
| case 16: { |
| makeToken(TK_DIVIDE); |
| break; |
| } |
| |
| // |
| // Rule 17: Token ::= ( |
| // |
| case 17: { |
| makeToken(TK_LPAREN); |
| break; |
| } |
| |
| // |
| // Rule 18: Token ::= ) |
| // |
| case 18: { |
| makeToken(TK_RPAREN); |
| break; |
| } |
| |
| // |
| // Rule 19: Token ::= > |
| // |
| case 19: { |
| makeToken(TK_GREATER); |
| break; |
| } |
| |
| // |
| // Rule 20: Token ::= < |
| // |
| case 20: { |
| makeToken(TK_LESS); |
| break; |
| } |
| |
| // |
| // Rule 21: Token ::= = |
| // |
| case 21: { |
| makeToken(TK_EQUAL); |
| break; |
| } |
| |
| // |
| // Rule 22: Token ::= > = |
| // |
| case 22: { |
| makeToken(TK_GREATER_EQUAL); |
| break; |
| } |
| |
| // |
| // Rule 23: Token ::= < = |
| // |
| case 23: { |
| makeToken(TK_LESS_EQUAL); |
| break; |
| } |
| |
| // |
| // Rule 24: Token ::= < > |
| // |
| case 24: { |
| makeToken(TK_NOT_EQUAL); |
| break; |
| } |
| |
| // |
| // Rule 25: Token ::= [ |
| // |
| case 25: { |
| makeToken(TK_LBRACKET); |
| break; |
| } |
| |
| // |
| // Rule 26: Token ::= ] |
| // |
| case 26: { |
| makeToken(TK_RBRACKET); |
| break; |
| } |
| |
| // |
| // Rule 27: Token ::= { |
| // |
| case 27: { |
| makeToken(TK_LBRACE); |
| break; |
| } |
| |
| // |
| // Rule 28: Token ::= } |
| // |
| case 28: { |
| makeToken(TK_RBRACE); |
| break; |
| } |
| |
| // |
| // Rule 29: Token ::= - > |
| // |
| case 29: { |
| makeToken(TK_ARROW); |
| break; |
| } |
| |
| // |
| // Rule 30: Token ::= | |
| // |
| case 30: { |
| makeToken(TK_BAR); |
| break; |
| } |
| |
| // |
| // Rule 31: Token ::= , |
| // |
| case 31: { |
| makeToken(TK_COMMA); |
| break; |
| } |
| |
| // |
| // Rule 32: Token ::= : |
| // |
| case 32: { |
| makeToken(TK_COLON); |
| break; |
| } |
| |
| // |
| // Rule 33: Token ::= : : |
| // |
| case 33: { |
| makeToken(TK_COLONCOLON); |
| break; |
| } |
| |
| // |
| // Rule 34: Token ::= ; |
| // |
| case 34: { |
| makeToken(TK_SEMICOLON); |
| break; |
| } |
| |
| // |
| // Rule 35: Token ::= DotToken |
| // |
| case 35: |
| break; |
| |
| // |
| // Rule 36: DotToken ::= . |
| // |
| case 36: { |
| makeToken(TK_DOT); |
| break; |
| } |
| |
| // |
| // Rule 37: Token ::= DotDotToken |
| // |
| case 37: |
| break; |
| |
| // |
| // Rule 38: DotDotToken ::= . . |
| // |
| case 38: { |
| makeToken(TK_DOTDOT); |
| break; |
| } |
| |
| // |
| // Rule 39: IntegerLiteral ::= Integer |
| // |
| case 39: { |
| makeToken(TK_INTEGER_LITERAL); |
| break; |
| } |
| |
| // |
| // Rule 264: Token ::= @ |
| // |
| case 264: { |
| makeToken(TK_AT); |
| break; |
| } |
| |
| // |
| // Rule 265: Token ::= ^ |
| // |
| case 265: { |
| makeToken(TK_CARET); |
| break; |
| } |
| |
| // |
| // Rule 266: Token ::= ^ ^ |
| // |
| case 266: { |
| makeToken(TK_CARETCARET); |
| break; |
| } |
| |
| // |
| // Rule 267: Token ::= ? |
| // |
| case 267: { |
| makeToken(TK_QUESTIONMARK); |
| break; |
| } |
| |
| // |
| // Rule 268: Token ::= : = |
| // |
| case 268: { |
| makeToken(TK_RESET_ASSIGN); |
| break; |
| } |
| |
| // |
| // Rule 269: Token ::= + = |
| // |
| case 269: { |
| makeToken(TK_ADD_ASSIGN); |
| break; |
| } |
| |
| // |
| // Rule 270: Token ::= ! |
| // |
| case 270: { |
| makeToken(TK_EXCLAMATION_MARK); |
| break; |
| } |
| |
| // |
| // Rule 271: Token ::= ! = |
| // |
| case 271: { |
| makeToken(TK_NOT_EQUAL_EXEQ); |
| break; |
| } |
| |
| // |
| // Rule 272: Token ::= < < |
| // |
| case 272: { |
| makeToken(TK_STEREOTYPE_QUALIFIER_OPEN); |
| break; |
| } |
| |
| // |
| // Rule 273: Token ::= > > |
| // |
| case 273: { |
| makeToken(TK_STEREOTYPE_QUALIFIER_CLOSE); |
| break; |
| } |
| |
| // |
| // Rule 274: Token ::= . . . |
| // |
| case 274: { |
| makeToken(TK_MULTIPLICITY_RANGE); |
| break; |
| } |
| |
| // |
| // Rule 275: Token ::= ~ |
| // |
| case 275: { |
| makeToken(TK_TILDE_SIGN); |
| break; |
| } |
| |
| // |
| // Rule 276: Token ::= : : = |
| // |
| case 276: { |
| makeToken(TK_COLONCOLONEQUAL); |
| break; |
| } |
| |
| // |
| // Rule 284: Token ::= DoubleQuote SLNotDQOpt DoubleQuote |
| // |
| case 284: { |
| makeToken(TK_STRING_LITERAL); |
| break; |
| } |
| |
| // |
| // Rule 288: Token ::= LG |
| // |
| case 288: { |
| makeToken(TK_LG); |
| break; |
| } |
| // |
| // Rule 289: Token ::= RG textAny lgOpt |
| // |
| case 289: { |
| makeToken(TK_TEXT); |
| break; |
| } |
| // |
| // Rule 299: Token ::= R E M RG commentAny lgPlus E N D R E M |
| // |
| case 299: { |
| skipToken(); |
| break; |
| } |
| |
| default: |
| break; |
| } |
| return; |
| } |
| } |