blob: 31acadf8e54b7362d8c8ba8e04a18d64aaaf9034 [file] [log] [blame]
/*
* Copyright (c) 2006, 2009 Borland Software Corporation and others.
* All rights reserved. This program and the accompanying materials
* are made available under the terms of the Eclipse Public License v1.0
* which accompanies this distribution, and is available at
* http://www.eclipse.org/legal/epl-v10.html
*
* Contributors:
* committers of openArchitectureWare - Xpand language syntax
* Artem Tikhomirov (Borland) - LALR grammar
* - Migration to OCL expressions
*/
package org.eclipse.gmf.internal.xpand.parser;
import java.util.LinkedList;
import java.util.List;
import java.util.regex.Matcher;
import java.util.regex.Pattern;
import lpg.lpgjavaruntime.LexParser;
import lpg.lpgjavaruntime.LexStream;
import lpg.lpgjavaruntime.LpgLexStream;
import lpg.lpgjavaruntime.Monitor;
import lpg.lpgjavaruntime.ParseTable;
import lpg.lpgjavaruntime.PrsStream;
import lpg.lpgjavaruntime.RuleAction;
import org.eclipse.gmf.internal.xpand.Activator;
import org.eclipse.gmf.internal.xpand.util.ParserException.ErrorLocationInfo;
public class XpandLexer extends LpgLexStream implements XpandParsersym, XpandLexersym, RuleAction {
private static ParseTable prs = new XpandLexerprs();
private PrsStream prsStream;
private final LexParser lexParser = new LexParser(this, prs, this);
private XpandKWLexer kwLexer;
public PrsStream getPrsStream() {
return prsStream;
}
public int getToken(int i) {
return lexParser.getToken(i);
}
public int getRhsFirstTokenIndex(int i) {
return lexParser.getFirstToken(i);
}
public int getRhsLastTokenIndex(int i) {
return lexParser.getLastToken(i);
}
public int getLeftSpan() {
return lexParser.getFirstToken();
}
public int getRightSpan() {
return lexParser.getLastToken();
}
public XpandLexer(char[] input_chars, String filename, int tab) {
super(input_chars, filename, tab);
}
public XpandLexer(char[] input_chars, String filename) {
this(input_chars, filename, 4);
}
public String[] orderedExportedSymbols() {
return XpandParsersym.orderedTerminalSymbols;
}
public LexStream getLexStream() {
return (LexStream) this;
}
public int[] getKeywordKinds() {
return kwLexer.getKeywordKinds();
}
public void lexer(PrsStream prsStream) {
lexer(null, prsStream);
}
public void lexer(Monitor monitor, PrsStream prsStream) {
if (getInputChars() == null) {
throw new NullPointerException("LexStream was not initialized");
}
this.prsStream = prsStream;
resetErrors();
prsStream.makeToken(0, 0, 0); // Token list must start with a bad token
lexParser.parseCharacters(monitor); // Lex the input characters
int i = getStreamIndex();
prsStream.makeToken(i, i, TK_EOF_TOKEN); // and end with the end of file
// token
prsStream.setStreamLength(prsStream.getSize());
return;
}
@Override
public void initialize(char[] content, String filename) {
super.initialize(content, filename);
if (this.kwLexer == null) {
this.kwLexer = new XpandKWLexer(getInputChars(), TK_IDENTIFIER);
} else {
this.kwLexer.setInputChars(getInputChars());
}
}
final void makeToken(int kind) {
int startOffset = getLeftSpan(), endOffset = getRightSpan();
makeToken(startOffset, endOffset, kind);
}
final void makeComment(int kind) {
int startOffset = getLeftSpan(), endOffset = getRightSpan();
super.getPrsStream().makeAdjunct(startOffset, endOffset, kind);
}
final void skipToken() {
}
final void checkForKeyWord() {
int startOffset = getLeftSpan(), endOffset = getRightSpan(), kwKind = kwLexer.lexer(startOffset, endOffset);
makeToken(startOffset, endOffset, kwKind);
}
// aux data for getKind method
private final int tokenKind[] = { Char_CtlCharNotWS, // 000 0x00
Char_CtlCharNotWS, // 001 0x01
Char_CtlCharNotWS, // 002 0x02
Char_CtlCharNotWS, // 003 0x03
Char_CtlCharNotWS, // 004 0x04
Char_CtlCharNotWS, // 005 0x05
Char_CtlCharNotWS, // 006 0x06
Char_CtlCharNotWS, // 007 0x07
Char_CtlCharNotWS, // 008 0x08
Char_HT, // 009 0x09
Char_LF, // 010 0x0A
Char_CtlCharNotWS, // 011 0x0B
Char_FF, // 012 0x0C
Char_CR, // 013 0x0D
Char_CtlCharNotWS, // 014 0x0E
Char_CtlCharNotWS, // 015 0x0F
Char_CtlCharNotWS, // 016 0x10
Char_CtlCharNotWS, // 017 0x11
Char_CtlCharNotWS, // 018 0x12
Char_CtlCharNotWS, // 019 0x13
Char_CtlCharNotWS, // 020 0x14
Char_CtlCharNotWS, // 021 0x15
Char_CtlCharNotWS, // 022 0x16
Char_CtlCharNotWS, // 023 0x17
Char_CtlCharNotWS, // 024 0x18
Char_CtlCharNotWS, // 025 0x19
Char_CtlCharNotWS, // 026 0x1A
Char_CtlCharNotWS, // 027 0x1B
Char_CtlCharNotWS, // 028 0x1C
Char_CtlCharNotWS, // 029 0x1D
Char_CtlCharNotWS, // 030 0x1E
Char_CtlCharNotWS, // 031 0x1F
Char_Space, // 032 0x20
Char_Exclamation, // 033 0x21
Char_DoubleQuote, // 034 0x22
Char_Sharp, // 035 0x23
Char_DollarSign, // 036 0x24
Char_Percent, // 037 0x25
Char_Ampersand, // 038 0x26
Char_SingleQuote, // 039 0x27
Char_LeftParen, // 040 0x28
Char_RightParen, // 041 0x29
Char_Star, // 042 0x2A
Char_Plus, // 043 0x2B
Char_Comma, // 044 0x2C
Char_Minus, // 045 0x2D
Char_Dot, // 046 0x2E
Char_Slash, // 047 0x2F
Char_0, // 048 0x30
Char_1, // 049 0x31
Char_2, // 050 0x32
Char_3, // 051 0x33
Char_4, // 052 0x34
Char_5, // 053 0x35
Char_6, // 054 0x36
Char_7, // 055 0x37
Char_8, // 056 0x38
Char_9, // 057 0x39
Char_Colon, // 058 0x3A
Char_SemiColon, // 059 0x3B
Char_LessThan, // 060 0x3C
Char_Equal, // 061 0x3D
Char_GreaterThan, // 062 0x3E
Char_QuestionMark, // 063 0x3F
Char_AtSign, // 064 0x40
Char_A, // 065 0x41
Char_B, // 066 0x42
Char_C, // 067 0x43
Char_D, // 068 0x44
Char_E, // 069 0x45
Char_F, // 070 0x46
Char_G, // 071 0x47
Char_H, // 072 0x48
Char_I, // 073 0x49
Char_J, // 074 0x4A
Char_K, // 075 0x4B
Char_L, // 076 0x4C
Char_M, // 077 0x4D
Char_N, // 078 0x4E
Char_O, // 079 0x4F
Char_P, // 080 0x50
Char_Q, // 081 0x51
Char_R, // 082 0x52
Char_S, // 083 0x53
Char_T, // 084 0x54
Char_U, // 085 0x55
Char_V, // 086 0x56
Char_W, // 087 0x57
Char_X, // 088 0x58
Char_Y, // 089 0x59
Char_Z, // 090 0x5A
Char_LeftBracket, // 091 0x5B
Char_BackSlash, // 092 0x5C
Char_RightBracket, // 093 0x5D
Char_Caret, // 094 0x5E
Char__, // 095 0x5F
Char_BackQuote, // 096 0x60
Char_a, // 097 0x61
Char_b, // 098 0x62
Char_c, // 099 0x63
Char_d, // 100 0x64
Char_e, // 101 0x65
Char_f, // 102 0x66
Char_g, // 103 0x67
Char_h, // 104 0x68
Char_i, // 105 0x69
Char_j, // 106 0x6A
Char_k, // 107 0x6B
Char_l, // 108 0x6C
Char_m, // 109 0x6D
Char_n, // 110 0x6E
Char_o, // 111 0x6F
Char_p, // 112 0x70
Char_q, // 113 0x71
Char_r, // 114 0x72
Char_s, // 115 0x73
Char_t, // 116 0x74
Char_u, // 117 0x75
Char_v, // 118 0x76
Char_w, // 119 0x77
Char_x, // 120 0x78
Char_y, // 121 0x79
Char_z, // 122 0x7A
Char_LeftBrace, // 123 0x7B
Char_VerticalBar, // 124 0x7C
Char_RightBrace, // 125 0x7D
Char_Tilde, // 126 0x7E
// [artem] As I understand, there's no need to specify characters
// other than those
// we'll try to access by index from getKind method (iow, this array
// is auxilary
// as I indicated in its comment). Thus, there seems to be no reason
// to specify
// Char_Acute here as it's done in OCL's LexerBasicMap.g
Char_AfterASCII, // for all chars in range 128..65534
Char_EOF // for '\uffff' or 65535
};
// Classify character at ith location
@Override
public final int getKind(int i) {
char c = (i >= getStreamLength() ? '\uffff' : getCharValue(i));
return (c < 128 // ASCII Character
? tokenKind[c]
: c == '\uffff' ? Char_EOF : getNonAsciiKind(c));
}
private final static int getNonAsciiKind(char c) {
if (c == '\u00AB') {
return Char_LG;
}
if (c == '\u00BB') {
return Char_RG;
}
if (c == '\u00b4') {
return Char_Acute; // For OCLLexer
}
return Char_AfterASCII;
}
public ErrorLocationInfo[] getErrors() {
return errors.toArray(new ErrorLocationInfo[errors.size()]);
}
private void resetErrors() {
errors.clear();
}
private final List<ErrorLocationInfo> errors = new LinkedList<ErrorLocationInfo>();
@Override
public void reportError(int i, String code) {
Activator.logWarn("Unexpected #reportError(int,String)");
reportError(i, i);
}
@Override
public void reportError(int leftToken, int rightToken) {
final int errorCode = (rightToken >= getStreamLength() ? EOF_CODE : leftToken == rightToken ? LEX_ERROR_CODE : INVALID_TOKEN_CODE);
final int endToken = (leftToken == rightToken ? rightToken : rightToken - 1);
reportError(errorCode, null, leftToken, endToken, getName(leftToken));
}
@Override
public void reportError(int errorCode, String locationInfo, String tokenText) {
try {
Matcher m = Pattern.compile("(?:[^:]+::)*[^:]+:(\\d+):(\\d+):(\\d+):(\\d+):.*").matcher(locationInfo);
boolean t = m.matches(); // ignore return value, rely on exception
// if anything wrong
assert t;
final int leftTokenLine = Integer.parseInt(m.group(1));
final int leftTokenColumn = Integer.parseInt(m.group(2));
final int rightTokenLine = Integer.parseInt(m.group(3));
final int rightTokenColumn = Integer.parseInt(m.group(4));
final String msg = tokenText + errorMsgText[errorCode];
errors.add(new ErrorLocationInfo(msg, leftTokenLine, leftTokenColumn, rightTokenLine, rightTokenColumn));
} catch (Throwable ex) {
// ignore
errors.add(new ErrorLocationInfo(tokenText + errorMsgText[errorCode]));
}
}
@Override
public void reportError(int errorCode, String locationInfo, int leftToken, int rightToken, String tokenText) {
final int leftTokenLine = getLine(leftToken);
final int leftTokenColumn = getColumn(leftToken);
final int rightTokenLine = getEndLine(rightToken);
final int rightTokenColumn = getEndColumn(rightToken);
final String msg = tokenText + errorMsgText[errorCode] + (locationInfo != null && locationInfo.length() > 0 ? '(' + locationInfo + ')' : "");
final int startOffset = leftToken;
final int endOffset = rightToken;
errors.add(new ErrorLocationInfo(msg, leftTokenLine, leftTokenColumn, rightTokenLine, rightTokenColumn, startOffset, endOffset));
}
/*
*/
public void ruleAction(int ruleNumber) {
switch (ruleNumber) {
//
// Rule 1: Token ::= Identifier
//
case 1: {
checkForKeyWord();
break;
}
//
// Rule 2: Token ::= EscapedSQ
//
case 2: {
makeToken(TK_STRING_LITERAL);
break;
}
//
// Rule 3: Token ::= SingleQuote SLNotSQ SingleQuote
//
case 3: {
makeToken(TK_STRING_LITERAL);
break;
}
//
// Rule 4: Token ::= Acute SLNotSQOpt Acute
//
case 4: {
makeToken(TK_STRING_LITERAL);
break;
}
//
// Rule 5: Token ::= BackQuote SLNotSQOpt Acute
//
case 5: {
makeToken(TK_STRING_LITERAL);
break;
}
//
// Rule 6: Token ::= IntegerLiteral
//
case 6:
break;
//
// Rule 7: Token ::= IntegerLiteral DotToken
//
case 7:
break;
//
// Rule 8: Token ::= IntegerLiteral DotDotToken
//
case 8:
break;
//
// Rule 9: Token ::= RealLiteral
//
case 9: {
makeToken(TK_REAL_LITERAL);
break;
}
//
// Rule 10: Token ::= SLC
//
case 10: {
makeComment(TK_SINGLE_LINE_COMMENT);
break;
}
//
// Rule 11: Token ::= / * Inside Stars /
//
case 11: {
makeComment(TK_MULTI_LINE_COMMENT);
break;
}
//
// Rule 12: Token ::= WS
//
case 12: {
skipToken();
break;
}
//
// Rule 13: Token ::= +
//
case 13: {
makeToken(TK_PLUS);
break;
}
//
// Rule 14: Token ::= -
//
case 14: {
makeToken(TK_MINUS);
break;
}
//
// Rule 15: Token ::= *
//
case 15: {
makeToken(TK_MULTIPLY);
break;
}
//
// Rule 16: Token ::= /
//
case 16: {
makeToken(TK_DIVIDE);
break;
}
//
// Rule 17: Token ::= (
//
case 17: {
makeToken(TK_LPAREN);
break;
}
//
// Rule 18: Token ::= )
//
case 18: {
makeToken(TK_RPAREN);
break;
}
//
// Rule 19: Token ::= >
//
case 19: {
makeToken(TK_GREATER);
break;
}
//
// Rule 20: Token ::= <
//
case 20: {
makeToken(TK_LESS);
break;
}
//
// Rule 21: Token ::= =
//
case 21: {
makeToken(TK_EQUAL);
break;
}
//
// Rule 22: Token ::= > =
//
case 22: {
makeToken(TK_GREATER_EQUAL);
break;
}
//
// Rule 23: Token ::= < =
//
case 23: {
makeToken(TK_LESS_EQUAL);
break;
}
//
// Rule 24: Token ::= < >
//
case 24: {
makeToken(TK_NOT_EQUAL);
break;
}
//
// Rule 25: Token ::= [
//
case 25: {
makeToken(TK_LBRACKET);
break;
}
//
// Rule 26: Token ::= ]
//
case 26: {
makeToken(TK_RBRACKET);
break;
}
//
// Rule 27: Token ::= {
//
case 27: {
makeToken(TK_LBRACE);
break;
}
//
// Rule 28: Token ::= }
//
case 28: {
makeToken(TK_RBRACE);
break;
}
//
// Rule 29: Token ::= - >
//
case 29: {
makeToken(TK_ARROW);
break;
}
//
// Rule 30: Token ::= |
//
case 30: {
makeToken(TK_BAR);
break;
}
//
// Rule 31: Token ::= ,
//
case 31: {
makeToken(TK_COMMA);
break;
}
//
// Rule 32: Token ::= :
//
case 32: {
makeToken(TK_COLON);
break;
}
//
// Rule 33: Token ::= : :
//
case 33: {
makeToken(TK_COLONCOLON);
break;
}
//
// Rule 34: Token ::= ;
//
case 34: {
makeToken(TK_SEMICOLON);
break;
}
//
// Rule 35: Token ::= DotToken
//
case 35:
break;
//
// Rule 36: DotToken ::= .
//
case 36: {
makeToken(TK_DOT);
break;
}
//
// Rule 37: Token ::= DotDotToken
//
case 37:
break;
//
// Rule 38: DotDotToken ::= . .
//
case 38: {
makeToken(TK_DOTDOT);
break;
}
//
// Rule 39: IntegerLiteral ::= Integer
//
case 39: {
makeToken(TK_INTEGER_LITERAL);
break;
}
//
// Rule 264: Token ::= @
//
case 264: {
makeToken(TK_AT);
break;
}
//
// Rule 265: Token ::= ^
//
case 265: {
makeToken(TK_CARET);
break;
}
//
// Rule 266: Token ::= ^ ^
//
case 266: {
makeToken(TK_CARETCARET);
break;
}
//
// Rule 267: Token ::= ?
//
case 267: {
makeToken(TK_QUESTIONMARK);
break;
}
//
// Rule 268: Token ::= : =
//
case 268: {
makeToken(TK_RESET_ASSIGN);
break;
}
//
// Rule 269: Token ::= + =
//
case 269: {
makeToken(TK_ADD_ASSIGN);
break;
}
//
// Rule 270: Token ::= !
//
case 270: {
makeToken(TK_EXCLAMATION_MARK);
break;
}
//
// Rule 271: Token ::= ! =
//
case 271: {
makeToken(TK_NOT_EQUAL_EXEQ);
break;
}
//
// Rule 272: Token ::= < <
//
case 272: {
makeToken(TK_STEREOTYPE_QUALIFIER_OPEN);
break;
}
//
// Rule 273: Token ::= > >
//
case 273: {
makeToken(TK_STEREOTYPE_QUALIFIER_CLOSE);
break;
}
//
// Rule 274: Token ::= . . .
//
case 274: {
makeToken(TK_MULTIPLICITY_RANGE);
break;
}
//
// Rule 275: Token ::= ~
//
case 275: {
makeToken(TK_TILDE_SIGN);
break;
}
//
// Rule 276: Token ::= : : =
//
case 276: {
makeToken(TK_COLONCOLONEQUAL);
break;
}
//
// Rule 284: Token ::= DoubleQuote SLNotDQOpt DoubleQuote
//
case 284: {
makeToken(TK_STRING_LITERAL);
break;
}
//
// Rule 288: Token ::= LG
//
case 288: {
makeToken(TK_LG);
break;
}
//
// Rule 289: Token ::= RG textAny lgOpt
//
case 289: {
makeToken(TK_TEXT);
break;
}
//
// Rule 299: Token ::= R E M RG commentAny lgPlus E N D R E M
//
case 299: {
skipToken();
break;
}
default:
break;
}
return;
}
}