blob: 090e888f16ebb7f00a9ee6c99f6ad76bea605dfd [file] [log] [blame]
/* The following code was generated by JFlex 1.2.2 on 8/6/16 1:32 PM */
/*******************************************************************************
* Copyright (c) 2004, 2016 IBM Corporation and others.
* All rights reserved. This program and the accompanying materials
* are made available under the terms of the Eclipse Public License 2.0
* which accompanies this distribution, and is available at
* https://www.eclipse.org/legal/epl-2.0/
*
* SPDX-License-Identifier: EPL-2.0
*
* Contributors:
* IBM Corporation - initial API and implementation
*******************************************************************************/
package org.eclipse.wst.html.core.internal.parser;
import java.io.CharArrayReader;
import java.io.IOException;
import java.util.ArrayList;
import java.util.Iterator;
import java.util.List;
import org.eclipse.wst.html.core.internal.contenttype.IntStack;
import org.eclipse.wst.sse.core.internal.ltk.parser.BlockMarker;
import org.eclipse.wst.sse.core.internal.ltk.parser.BlockTokenizer;
import org.eclipse.wst.sse.core.internal.provisional.text.ITextRegion;
import org.eclipse.wst.sse.core.internal.util.Debug;
import org.eclipse.wst.sse.core.utils.StringUtils;
import org.eclipse.wst.xml.core.internal.Logger;
import org.eclipse.wst.xml.core.internal.parser.regions.XMLParserRegionFactory;
import org.eclipse.wst.xml.core.internal.regions.DOMRegionContext;
/**
* Generate with -skel skeleton.sse
*/
/**
* This class is a scanner generated by
* <a href="http://www.informatik.tu-muenchen.de/~kleing/jflex/">JFlex</a> 1.2.2
* on 8/6/16 1:32 PM from the specification file
* <tt>file:/Users/nitin/git/webtools.sourceediting/bundles/org.eclipse.wst.sse.core/DevTimeSupport/SedModel/HTMLTokenizer/devel/HTMLTokenizer.jflex</tt>
*/
public class HTMLTokenizer implements BlockTokenizer, DOMRegionContext {
/** this character denotes the end of file */
final public static int YYEOF = -1;
/*
 * lexical states: the values handed to yybegin(...) and stored in
 * yy_lexical_state; YYINITIAL is the state a new or reset tokenizer starts in
 */
final public static int ST_XML_DOCTYPE_EXTERNAL_ID = 19;
final public static int ST_XML_ELEMENT_DECLARATION_CONTENT = 23;
final public static int ST_XML_PI_TAG_CLOSE = 11;
final public static int ST_XML_DECLARATION_CLOSE = 17;
final public static int ST_XML_PI_ATTRIBUTE_VALUE = 10;
final public static int ST_XML_TAG_NAME = 12;
final public static int ST_XML_ATTRIBUTE_VALUE = 15;
final public static int ST_XML_DOCTYPE_ID_SYSTEM = 21;
final public static int ST_XML_ATTRIBUTE_NAME = 13;
final public static int ST_XML_ELEMENT_DECLARATION = 22;
final public static int ST_XML_DOCTYPE_DECLARATION = 18;
final public static int ST_XML_ATTLIST_DECLARATION = 24;
final public static int ST_XML_COMMENT_END = 4;
final public static int ST_CDATA_TEXT = 1;
final public static int ST_XML_COMMENT = 3;
final public static int ST_PI_CONTENT = 7;
final public static int ST_PI_WS = 6;
final public static int ST_CDATA_END = 2;
final public static int ST_XML_ATTLIST_DECLARATION_CONTENT = 25;
// state entered by beginBlockMarkerScan(...) to start inside a block tag's text
final public static int ST_BLOCK_TAG_SCAN = 26;
final public static int ST_XML_PI_EQUALS = 9;
final public static int ST_XML_DECLARATION = 16;
final public static int YYINITIAL = 0;
final public static int ST_XML_DOCTYPE_ID_PUBLIC = 20;
final public static int ST_XML_EQUALS = 14;
final public static int ST_PI = 5;
final public static int ST_XML_PI_ATTRIBUTE_NAME = 8;
/**
* Packed form of the table that translates characters to character classes;
* it is unpacked into yycmap by yy_unpack_cmap
*/
final private static String yycmap_packed =
"\11\0\1\5\1\25\2\0\1\20\22\0\1\20\1\24\1\15\1\14"+
"\1\22\1\23\1\16\1\17\1\13\1\13\1\10\1\22\1\22\1\7"+
"\1\6\1\3\12\21\1\10\1\61\1\1\1\46\1\2\1\4\1\22"+
"\1\36\1\62\1\34\1\35\1\51\1\57\1\40\1\40\1\43\1\40"+
"\1\40\1\32\1\30\1\45\1\44\1\50\1\40\1\40\1\56\1\37"+
"\1\60\2\40\1\26\1\47\1\40\1\11\1\0\1\12\1\0\1\10"+
"\1\0\1\53\1\62\1\63\1\54\1\41\1\57\1\40\1\66\1\43"+
"\2\40\1\33\1\31\1\45\1\44\1\50\1\40\1\40\1\42\1\52"+
"\1\60\1\40\1\40\1\27\1\55\1\40\1\0\1\0\72\0\1\65"+
"\10\0\27\64\1\0\37\64\1\0\72\64\2\0\13\64\2\0\10\64"+
"\1\0\65\64\1\0\104\64\11\0\44\64\3\0\2\64\4\0\36\64"+
"\70\0\131\64\22\0\7\64\16\0\2\65\56\0\106\65\32\0\2\65"+
"\44\0\1\64\1\65\3\64\1\0\1\64\1\0\24\64\1\0\54\64"+
"\1\0\7\64\3\0\1\64\1\0\1\64\1\0\1\64\1\0\1\64"+
"\1\0\22\64\15\0\14\64\1\0\102\64\1\0\14\64\1\0\44\64"+
"\1\0\4\65\11\0\65\64\2\0\2\64\2\0\2\64\3\0\34\64"+
"\2\0\10\64\2\0\2\64\67\0\46\64\2\0\1\64\7\0\46\64"+
"\12\0\21\65\1\0\27\65\1\0\3\65\1\0\1\65\1\0\2\65"+
"\1\0\1\65\13\0\33\64\5\0\3\64\56\0\32\64\5\0\1\65"+
"\12\64\10\65\15\0\12\65\6\0\1\65\107\64\2\0\5\64\1\0"+
"\17\64\1\0\4\64\1\0\1\64\17\65\2\64\2\65\1\0\4\65"+
"\2\0\12\65\u0207\0\3\65\1\0\65\64\2\0\1\65\1\64\20\65"+
"\3\0\4\65\3\0\12\64\2\65\2\0\12\65\21\0\3\65\1\0"+
"\10\64\2\0\2\64\2\0\26\64\1\0\7\64\1\0\1\64\3\0"+
"\4\64\2\0\1\65\1\0\7\65\2\0\2\65\2\0\3\65\11\0"+
"\1\65\4\0\2\64\1\0\3\64\2\65\2\0\12\65\2\64\20\0"+
"\1\65\2\0\6\64\4\0\2\64\2\0\26\64\1\0\7\64\1\0"+
"\2\64\1\0\2\64\1\0\2\64\2\0\1\65\1\0\5\65\4\0"+
"\2\65\2\0\3\65\13\0\4\64\1\0\1\64\7\0\12\65\2\65"+
"\3\64\14\0\3\65\1\0\7\64\1\0\1\64\1\0\3\64\1\0"+
"\26\64\1\0\7\64\1\0\2\64\1\0\5\64\2\0\1\65\1\64"+
"\10\65\1\0\3\65\1\0\3\65\22\0\1\64\5\0\12\65\21\0"+
"\3\65\1\0\10\64\2\0\2\64\2\0\26\64\1\0\7\64\1\0"+
"\2\64\2\0\4\64\2\0\1\65\1\64\6\65\3\0\2\65\2\0"+
"\3\65\10\0\2\65\4\0\2\64\1\0\3\64\4\0\12\65\22\0"+
"\2\65\1\0\6\64\3\0\3\64\1\0\4\64\3\0\2\64\1\0"+
"\1\64\1\0\2\64\3\0\2\64\3\0\3\64\3\0\10\64\1\0"+
"\3\64\4\0\5\65\3\0\3\65\1\0\4\65\11\0\1\65\17\0"+
"\11\65\21\0\3\65\1\0\10\64\1\0\3\64\1\0\27\64\1\0"+
"\12\64\1\0\5\64\4\0\7\65\1\0\3\65\1\0\4\65\7\0"+
"\2\65\11\0\2\64\4\0\12\65\22\0\2\65\1\0\10\64\1\0"+
"\3\64\1\0\27\64\1\0\12\64\1\0\5\64\4\0\7\65\1\0"+
"\3\65\1\0\4\65\7\0\2\65\7\0\1\64\1\0\2\64\4\0"+
"\12\65\22\0\2\65\1\0\10\64\1\0\3\64\1\0\27\64\1\0"+
"\20\64\4\0\6\65\2\0\3\65\1\0\4\65\11\0\1\65\10\0"+
"\2\64\4\0\12\65\221\0\56\64\1\0\1\64\1\65\2\64\7\65"+
"\5\0\6\64\1\65\10\65\1\0\12\65\47\0\2\64\1\0\1\64"+
"\2\0\2\64\1\0\1\64\2\0\1\64\6\0\4\64\1\0\7\64"+
"\1\0\3\64\1\0\1\64\1\0\1\64\2\0\2\64\1\0\2\64"+
"\1\0\1\64\1\65\2\64\6\65\1\0\2\65\1\64\2\0\5\64"+
"\1\0\1\65\1\0\6\65\2\0\12\65\76\0\2\65\6\0\12\65"+
"\13\0\1\65\1\0\1\65\1\0\1\65\4\0\2\65\10\64\1\0"+
"\41\64\7\0\24\65\1\0\6\65\4\0\6\65\1\0\1\65\1\0"+
"\25\65\3\0\7\65\1\0\1\65\346\0\46\64\12\0\47\64\11\0"+
"\1\64\1\0\2\64\1\0\3\64\1\0\1\64\1\0\2\64\1\0"+
"\5\64\51\0\1\64\1\0\1\64\1\0\1\64\13\0\1\64\1\0"+
"\1\64\1\0\1\64\3\0\2\64\3\0\1\64\5\0\3\64\1\0"+
"\1\64\1\0\1\64\1\0\1\64\1\0\1\64\3\0\2\64\3\0"+
"\2\64\1\0\1\64\50\0\1\64\11\0\1\64\2\0\1\64\2\0"+
"\2\64\7\0\2\64\1\0\1\64\1\0\7\64\50\0\1\64\4\0"+
"\1\64\10\0\1\64\u0c06\0\234\64\4\0\132\64\6\0\26\64\2\0"+
"\6\64\2\0\46\64\2\0\6\64\2\0\10\64\1\0\1\64\1\0"+
"\1\64\1\0\1\64\1\0\37\64\2\0\65\64\1\0\7\64\1\0"+
"\1\64\3\0\3\64\1\0\7\64\3\0\4\64\2\0\6\64\4\0"+
"\15\64\5\0\3\64\1\0\7\64\323\0\15\65\4\0\1\65\104\0"+
"\1\64\3\0\2\64\2\0\1\64\121\0\3\64\u0e82\0\1\65\1\0"+
"\1\64\31\0\11\64\6\65\1\0\5\65\13\0\124\64\4\0\2\65"+
"\2\0\2\65\2\0\132\64\1\0\3\65\6\0\50\64\u1cd3\0\u51a6\64"+
"\u0c5a\0\u2ba4\64\134\0\u0800\0\u1ffe\0\2\0";
/**
* Translates characters to character classes; produced by running
* yy_unpack_cmap over yycmap_packed when the class is initialized
*/
final private static char [] yycmap = yy_unpack_cmap(yycmap_packed);
/**
* Translates a state to a row index in the transition table
*/
final private static int yy_rowMap [] = {
0, 55, 110, 165, 220, 275, 330, 385, 440, 495,
550, 605, 660, 715, 770, 825, 880, 935, 990, 1045,
1100, 1155, 1210, 1265, 1320, 1375, 1430, 1485, 1540, 1595,
1650, 1705, 1760, 1705, 1760, 1815, 1705, 1705, 1760, 1870,
1925, 1980, 2035, 2090, 2145, 2200, 1705, 1760, 2255, 2310,
2365, 1705, 2420, 2420, 2475, 2530, 2585, 2255, 2640, 2695,
1705, 2750, 2805, 2860, 2915, 1705, 2970, 3025, 3080, 3135,
3190, 1705, 3245, 3300, 3355, 3410, 3465, 3520, 3575, 3630,
3630, 3685, 3740, 3795, 3850, 3850, 3905, 3960, 4015, 4070,
4070, 4125, 4180, 4235, 4290, 1705, 4345, 4345, 4400, 4455,
4510, 4565, 1705, 1705, 1760, 1705, 1705, 4620, 4675, 4730,
4785, 4840, 4895, 4950, 5005, 5060, 1705, 5115, 5170, 1705,
1705, 2420, 5225, 2530, 1705, 5280, 2585, 1705, 2970, 5335,
3080, 1705, 5390, 3135, 4620, 5445, 5500, 5555, 3410, 1705,
5610, 5665, 3630, 3685, 3630, 5720, 3740, 1705, 5775, 5830,
5885, 5885, 5940, 5995, 3850, 3905, 3850, 6050, 3960, 1705,
6105, 4015, 4070, 6160, 4125, 1705, 6215, 6270, 6325, 6325,
6380, 6435, 6490, 4345, 6545, 4400, 1705, 6600, 6655, 6710,
6710, 6765, 6820, 6875, 6930, 6985, 7040, 7095, 1705, 7150,
7205, 1705, 1705, 1705, 2035, 7260, 7315, 7370, 7425, 7480,
7535, 5775, 7590, 7590, 6215, 7645, 7645, 7700, 6600, 7755,
7755, 7810, 1705, 7865, 7920, 7975, 1705, 8030, 8085, 8140,
8195, 8250, 8305, 8360, 5940, 6380, 8415, 6765, 8470, 8525,
8580, 1705, 8635, 8690, 8745, 8800, 8855, 8910, 8965, 9020,
9075, 9130, 9185, 9240, 9295, 1705, 1705, 9350, 9405, 9460,
9515, 1705, 1705, 1705, 9570, 9625, 9680, 9735, 9790, 9845,
1705, 9900, 4235, 4510, 9955, 10010, 10065, 10120, 2035
};
/**
* The packed transition table of the DFA
*/
final private static String yy_packed =
"\1\34\1\35\14\34\1\36\4\34\1\37\43\34\1\40"+
"\1\41\65\40\1\42\1\43\10\42\1\44\12\42\1\45"+
"\41\42\1\46\1\47\65\46\1\42\1\43\5\42\1\50"+
"\15\42\1\45\42\42\1\43\2\42\1\51\1\52\2\42"+
"\1\53\3\42\1\53\3\42\1\52\4\42\1\52\1\54"+
"\1\55\16\53\1\42\12\53\1\42\3\53\1\42\1\53"+
"\1\42\1\43\2\42\1\51\1\56\12\42\1\56\4\42"+
"\1\56\41\42\1\57\1\60\2\57\1\61\20\57\1\45"+
"\41\57\1\42\1\43\2\42\1\62\1\52\2\42\1\63"+
"\3\42\1\63\3\42\1\52\4\42\1\52\20\63\1\42"+
"\12\63\1\42\3\63\1\42\1\63\1\42\1\43\2\42"+
"\1\62\1\52\2\42\1\63\3\42\1\63\3\42\1\52"+
"\4\42\1\52\20\63\1\64\12\63\1\42\3\63\1\42"+
"\1\63\1\65\1\43\1\42\1\66\1\67\1\52\7\65"+
"\1\70\1\65\1\71\1\52\4\65\1\52\41\65\1\42"+
"\1\43\2\42\1\72\20\42\1\45\41\42\1\73\1\74"+
"\1\75\1\76\4\73\1\77\3\73\1\77\11\73\20\100"+
"\1\73\12\100\1\73\3\100\1\73\1\100\1\42\1\74"+
"\1\75\1\76\1\42\1\52\2\42\5\101\3\42\1\52"+
"\4\42\1\52\20\101\1\42\12\101\1\42\3\101\1\42"+
"\1\101\1\42\1\74\1\75\1\76\1\42\1\52\2\42"+
"\5\101\3\42\1\52\4\42\1\52\20\101\1\102\12\101"+
"\1\42\3\101\1\42\1\101\1\103\1\74\1\75\1\104"+
"\1\103\1\52\7\103\1\105\1\103\1\106\1\52\4\103"+
"\1\52\41\103\1\42\1\107\1\110\2\42\1\52\12\42"+
"\1\52\4\42\1\52\7\42\1\111\1\112\2\42\1\113"+
"\7\42\1\113\1\42\1\112\1\111\13\42\1\43\1\110"+
"\2\42\1\52\3\42\1\114\6\42\1\52\4\42\1\52"+
"\42\42\1\43\1\110\2\42\1\52\2\42\1\115\1\114"+
"\2\42\1\115\3\42\1\52\4\42\1\52\20\115\1\42"+
"\12\115\1\42\3\115\1\42\1\115\1\42\1\43\1\110"+
"\2\42\1\52\3\42\1\114\6\42\1\52\4\42\1\52"+
"\14\42\1\116\5\42\1\117\5\42\1\116\10\42\1\120"+
"\1\43\1\110\1\121\1\120\1\52\3\120\1\122\3\120"+
"\1\123\1\120\1\124\1\52\4\120\1\52\41\120\1\125"+
"\1\43\1\110\1\126\1\125\1\52\3\125\1\127\3\125"+
"\1\130\1\125\1\131\1\52\4\125\1\52\41\125\1\132"+
"\1\43\1\110\1\133\1\132\1\52\7\132\1\134\1\132"+
"\1\135\1\52\4\132\1\52\41\132\1\136\1\137\1\140"+
"\64\136\1\141\1\43\1\110\1\142\1\141\1\52\7\141"+
"\1\143\1\141\1\144\1\52\4\141\1\52\41\141\1\145"+
"\1\146\1\147\64\145\1\150\1\151\65\150\1\34\1\0"+
"\14\34\1\0\4\34\1\0\43\34\3\0\1\152\1\153"+
"\17\0\1\154\47\0\1\155\2\0\1\156\3\0\1\157"+
"\3\0\1\155\4\0\1\155\20\156\1\0\12\156\1\0"+
"\3\156\1\0\1\156\5\0\1\155\2\0\1\160\3\0"+
"\1\160\3\0\1\155\2\0\1\161\1\0\1\155\20\160"+
"\1\0\12\160\1\0\3\160\1\0\1\160\113\0\1\162"+
"\54\0\1\163\63\0\1\164\61\0\1\165\71\0\1\52"+
"\12\0\1\52\4\0\1\52\47\0\7\53\4\0\1\53"+
"\4\0\20\53\1\0\12\53\1\0\5\53\6\0\7\53"+
"\4\0\1\53\4\0\2\53\2\166\14\53\1\0\12\53"+
"\1\0\5\53\6\0\7\53\4\0\1\53\4\0\2\53"+
"\1\166\1\167\14\53\1\0\12\53\1\0\5\53\5\0"+
"\1\56\12\0\1\56\4\0\1\56\43\0\1\170\66\0"+
"\1\171\72\0\7\63\4\0\1\63\4\0\20\63\1\0"+
"\12\63\1\0\5\63\1\65\2\0\1\172\1\65\1\0"+
"\7\65\1\0\1\65\2\0\4\65\1\0\42\65\1\0"+
"\1\171\1\172\1\65\1\0\7\65\1\0\1\65\2\0"+
"\4\65\1\0\41\65\1\70\2\173\1\174\1\70\1\173"+
"\7\70\1\175\1\70\2\173\4\70\1\173\41\70\1\71"+
"\2\176\1\177\1\71\1\176\7\71\1\176\1\71\1\175"+
"\1\176\4\71\1\176\41\71\1\73\3\0\22\73\20\0"+
"\1\73\12\0\1\73\3\0\1\73\4\0\1\152\20\0"+
"\1\154\44\0\1\200\64\0\1\73\3\0\2\73\7\77"+
"\4\73\1\77\4\73\20\100\1\73\12\100\1\73\3\100"+
"\1\77\1\100\6\0\7\100\4\0\1\100\4\0\20\100"+
"\1\0\12\100\1\0\5\100\6\0\7\101\4\0\1\101"+
"\4\0\20\101\1\0\12\101\1\0\5\101\1\103\2\0"+
"\1\201\1\103\1\0\7\103\1\0\1\103\2\0\4\103"+
"\1\0\42\103\1\0\1\200\1\201\1\103\1\0\7\103"+
"\1\0\1\103\2\0\4\103\1\0\41\103\1\105\2\202"+
"\1\203\1\105\1\202\7\105\1\204\1\105\2\202\4\105"+
"\1\202\41\105\1\106\2\205\1\206\1\106\1\205\7\106"+
"\1\205\1\106\1\204\1\205\4\106\1\205\41\106\3\0"+
"\1\152\20\0\1\207\106\0\1\210\61\0\1\211\12\0"+
"\1\211\46\0\2\212\33\0\12\213\1\214\54\213\6\0"+
"\7\115\4\0\1\115\4\0\20\115\1\0\12\115\1\0"+
"\5\115\47\0\1\215\5\0\1\215\71\0\1\216\6\0"+
"\1\120\2\0\1\217\1\120\1\0\7\120\1\0\1\120"+
"\2\0\4\120\1\0\41\120\1\122\2\213\1\220\1\122"+
"\1\213\4\122\1\221\2\122\1\213\1\122\2\213\4\122"+
"\1\213\41\122\1\123\2\222\1\223\1\123\1\222\7\123"+
"\1\224\1\123\2\222\4\123\1\222\41\123\1\225\2\226"+
"\1\227\1\230\1\226\3\230\2\225\2\230\1\226\1\225"+
"\1\231\1\232\4\230\1\232\36\230\2\225\1\230\1\125"+
"\2\0\1\233\1\125\1\0\7\125\1\0\1\125\2\0"+
"\4\125\1\0\41\125\1\127\2\213\1\234\1\127\1\213"+
"\4\127\1\235\2\127\1\213\1\127\2\213\4\127\1\213"+
"\41\127\1\130\2\236\1\237\1\130\1\236\7\130\1\240"+
"\1\130\2\236\4\130\1\236\41\130\1\131\2\241\1\242"+
"\1\131\1\241\7\131\1\241\1\131\1\240\1\241\4\131"+
"\1\241\41\131\1\132\2\0\1\243\1\132\1\0\7\132"+
"\1\0\1\132\2\0\4\132\1\0\41\132\1\134\2\244"+
"\1\245\1\134\1\244\7\134\1\246\1\134\2\244\4\134"+
"\1\244\41\134\1\247\2\250\1\251\1\252\1\250\3\252"+
"\2\247\2\252\1\250\1\247\1\253\1\254\4\252\1\254"+
"\36\252\2\247\1\252\2\136\1\0\66\136\1\0\21\136"+
"\1\255\42\136\1\141\2\0\1\256\1\141\1\0\7\141"+
"\1\0\1\141\2\0\4\141\1\0\41\141\1\143\2\257"+
"\1\260\1\143\1\257\7\143\1\261\1\143\2\257\4\143"+
"\1\257\41\143\1\262\2\263\1\264\1\265\1\263\3\265"+
"\2\262\2\265\1\263\1\262\1\266\1\267\4\265\1\267"+
"\36\265\2\262\1\265\2\145\1\0\66\145\1\0\21\145"+
"\1\270\42\145\7\0\1\271\1\0\1\272\62\0\1\155"+
"\2\0\1\34\3\0\1\34\3\0\1\155\4\0\1\155"+
"\20\34\1\0\12\34\1\0\3\34\1\0\1\34\1\273"+
"\1\0\3\273\1\274\7\156\1\273\1\0\1\273\1\274"+
"\1\156\1\273\1\0\1\273\1\274\20\156\1\273\12\156"+
"\1\275\5\156\1\273\1\0\3\273\1\274\7\156\1\273"+
"\1\0\1\273\1\274\1\276\1\273\1\0\1\273\1\274"+
"\1\156\1\277\16\156\1\273\12\156\1\275\5\156\1\273"+
"\1\0\3\273\1\274\7\160\1\273\1\0\1\273\1\274"+
"\1\160\1\273\1\0\1\273\1\274\20\160\1\273\12\160"+
"\1\300\5\160\23\0\1\161\54\0\1\272\57\0\1\301"+
"\66\0\1\302\72\0\7\53\4\0\1\53\4\0\4\53"+
"\2\303\12\53\1\0\12\53\1\0\5\53\6\0\7\53"+
"\4\0\1\53\4\0\4\53\1\303\1\304\12\53\1\0"+
"\12\53\1\0\5\53\15\173\1\175\51\173\17\176\1\175"+
"\47\176\15\202\1\204\51\202\17\205\1\204\47\205\34\0"+
"\1\305\26\0\1\305\42\0\1\306\12\0\1\306\55\0"+
"\1\307\7\0\1\307\57\0\1\310\13\0\1\310\72\0"+
"\1\311\4\0\15\222\1\224\51\222\1\225\2\226\1\312"+
"\1\225\1\226\7\225\1\226\1\225\1\224\1\226\4\225"+
"\1\226\41\225\17\226\1\224\47\226\1\225\2\226\1\312"+
"\1\225\1\226\7\225\1\226\1\225\1\313\1\226\4\225"+
"\1\226\41\225\17\0\1\314\47\0\17\226\1\313\47\226"+
"\15\236\1\240\51\236\17\241\1\240\47\241\15\244\1\246"+
"\51\244\1\247\2\250\1\315\1\247\1\250\7\247\1\250"+
"\1\247\1\246\1\250\4\247\1\250\41\247\17\250\1\246"+
"\47\250\1\247\2\250\1\315\1\247\1\250\7\247\1\250"+
"\1\247\1\316\1\250\4\247\1\250\41\247\17\0\1\317"+
"\47\0\17\250\1\316\47\250\2\136\1\0\6\136\1\320"+
"\55\136\15\257\1\261\51\257\1\262\2\263\1\321\1\262"+
"\1\263\7\262\1\263\1\262\1\261\1\263\4\262\1\263"+
"\41\262\17\263\1\261\47\263\1\262\2\263\1\321\1\262"+
"\1\263\7\262\1\263\1\262\1\322\1\263\4\262\1\263"+
"\41\262\17\0\1\323\47\0\17\263\1\322\47\263\2\145"+
"\1\0\6\145\1\324\55\145\7\0\1\325\113\0\1\326"+
"\32\0\1\273\1\0\14\273\1\0\4\273\1\0\35\273"+
"\1\0\6\273\1\0\3\273\1\274\2\273\1\327\3\273"+
"\1\327\1\273\1\0\1\273\1\274\2\273\1\0\1\273"+
"\1\274\20\327\1\273\12\327\1\330\3\327\1\273\1\327"+
"\1\273\1\0\3\273\1\274\7\156\1\273\1\0\1\273"+
"\1\274\1\276\1\273\1\0\1\273\1\274\20\156\1\273"+
"\12\156\1\331\5\156\1\273\1\0\3\273\1\274\7\156"+
"\1\273\1\0\1\273\1\274\1\332\1\273\1\0\1\273"+
"\1\274\6\156\3\332\2\156\1\332\4\156\1\273\2\156"+
"\1\332\1\156\2\332\2\156\1\332\1\156\1\275\2\332"+
"\3\156\6\0\1\53\1\333\5\53\4\0\1\53\4\0"+
"\20\53\1\0\12\53\1\0\5\53\37\0\1\334\12\0"+
"\1\334\46\0\2\335\63\0\2\336\74\0\1\337\12\0"+
"\1\337\46\0\2\340\36\0\2\341\1\0\3\341\2\0"+
"\2\341\2\0\1\231\44\341\2\0\1\341\3\0\2\342"+
"\1\0\3\342\2\0\2\342\2\0\1\253\44\342\2\0"+
"\1\342\2\136\1\0\31\136\1\343\32\136\3\0\2\344"+
"\1\0\3\344\2\0\2\344\2\0\1\266\44\344\2\0"+
"\1\344\2\145\1\0\31\145\1\345\32\145\35\0\1\346"+
"\31\0\1\273\1\0\3\273\1\347\7\327\1\273\1\0"+
"\1\273\1\347\1\327\1\273\1\0\1\273\1\347\20\327"+
"\1\273\12\327\1\350\5\327\61\0\1\330\5\0\1\273"+
"\1\0\3\273\1\274\7\156\1\273\1\0\1\273\1\274"+
"\1\332\1\273\1\0\1\273\1\274\6\156\3\332\2\156"+
"\1\332\4\156\1\273\2\156\1\332\1\156\2\332\2\156"+
"\1\332\1\156\1\331\2\332\3\156\6\0\7\53\4\0"+
"\1\53\4\0\14\53\1\351\3\53\1\0\12\53\1\0"+
"\5\53\47\0\1\352\5\0\1\352\54\0\1\353\64\0"+
"\1\354\7\0\1\354\56\0\1\355\7\0\1\355\60\0"+
"\1\356\23\0\2\136\1\0\32\136\1\357\31\136\2\145"+
"\1\0\32\145\1\360\31\145\36\0\1\361\30\0\1\273"+
"\1\0\3\273\1\347\2\273\1\327\3\273\1\327\1\273"+
"\1\0\1\273\1\347\2\273\1\0\1\273\1\347\20\327"+
"\1\273\12\327\1\0\3\327\1\273\1\327\6\0\7\53"+
"\4\0\1\53\4\0\20\53\1\0\3\53\1\362\6\53"+
"\1\0\5\53\50\0\1\363\60\0\1\364\13\0\1\364"+
"\55\0\1\365\51\0\2\366\71\0\1\367\26\0\1\367"+
"\3\0\2\136\1\0\33\136\1\370\30\136\2\145\1\0"+
"\33\145\1\371\30\145\37\0\1\372\35\0\7\53\4\0"+
"\1\53\4\0\20\53\1\0\6\53\1\373\3\53\1\0"+
"\5\53\41\0\1\374\7\0\1\374\54\0\1\375\12\0"+
"\1\375\53\0\1\376\12\0\1\376\14\0\2\136\1\0"+
"\34\136\1\377\27\136\2\145\1\0\34\145\1\u0100\27\145"+
"\36\0\1\u0101\36\0\7\53\4\0\1\53\4\0\5\53"+
"\1\u0102\12\53\1\0\12\53\1\0\5\53\2\136\1\0"+
"\33\136\1\u0103\30\136\2\145\1\0\33\145\1\u0104\30\145"+
"\11\0\1\u0105\63\0\7\53\4\0\1\53\4\0\13\53"+
"\1\u0106\4\53\1\0\12\53\1\0\5\53\2\136\1\0"+
"\6\136\1\u0107\55\136\2\145\1\0\6\145\1\u0108\55\145"+
"\6\0\7\53\4\0\1\53\4\0\14\53\1\u0109\3\53"+
"\1\0\12\53\1\0\5\53\6\0\7\53\4\0\1\53"+
"\4\0\20\53\1\0\12\53\1\0\4\53\1\u010a\6\0"+
"\7\53\4\0\1\53\4\0\13\53\1\u010b\4\53\1\0"+
"\12\53\1\0\5\53\6\0\7\53\4\0\1\53\4\0"+
"\13\53\1\u010c\4\53\1\0\12\53\1\0\5\53\6\0"+
"\7\53\4\0\1\53\4\0\20\53\1\0\3\53\1\u010d"+
"\6\53\1\0\5\53";
/**
* The transition table of the DFA; produced by running yy_unpack over
* yy_packed when the class is initialized
*/
final private static int yytrans [] = yy_unpack(yy_packed);
/*
 * error codes; the value of each code lines up with the position of its
 * message in YY_ERROR_MSG (code 1 is currently unused, so it is commented out)
 */
final private static int YY_UNKNOWN_ERROR = 0;
// final private static int YY_ILLEGAL_STATE = 1;
final private static int YY_NO_MATCH = 2;
final private static int YY_PUSHBACK_2BIG = 3;
/* error messages for the codes above */
final private static String YY_ERROR_MSG[] = {
"Unknown internal scanner error", //$NON-NLS-1$
"Internal error: unknown state", //$NON-NLS-1$
"Error: could not match input", //$NON-NLS-1$
"Error: pushback value was too large" //$NON-NLS-1$
};
/**
* YY_ATTRIBUTE[aState] contains the attributes of state <code>aState</code>
*/
private final static byte YY_ATTRIBUTE[] = {
1, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 1, 1, 1, 1,
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 9,
1, 9, 1, 1, 9, 9, 1, 1, 1, 1, 1, 1, 1, 1, 9, 1,
1, 1, 1, 9, 1, 1, 1, 1, 1, 1, 1, 1, 9, 1, 1, 1,
1, 9, 1, 1, 1, 1, 1, 9, 1, 1, 1, 1, 1, 1, 1, 1,
1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 9,
1, 1, 1, 1, 1, 1, 9, 9, 1, 9, 9, 1, 0, 1, 1, 1,
1, 0, 0, 0, 9, 1, 1, 9, 9, 0, 0, 0, 9, 0, 0, 9,
0, 0, 0, 9, 0, 0, 0, 0, 0, 0, 0, 9, 0, 0, 0, 0,
1, 0, 0, 9, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 0, 9,
0, 0, 0, 0, 0, 9, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0,
9, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 9, 1, 1, 9,
9, 9, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1,
0, 1, 0, 1, 9, 0, 1, 1, 9, 1, 1, 0, 0, 0, 0, 0,
0, 0, 1, 0, 1, 0, 1, 9, 1, 0, 0, 0, 0, 0, 1, 1,
0, 1, 0, 0, 0, 9, 9, 1, 1, 0, 1, 9, 9, 9, 1, 1,
0, 1, 1, 1, 9, 1, 1, 1, 1, 1, 1, 1, 1
};
/** the input device */
private java.io.Reader yy_reader;
/** the current state of the DFA */
private int yy_state;
/** the current lexical state; starts out as YYINITIAL */
private int yy_lexical_state = YYINITIAL;
/** this buffer contains the current text to be matched and is
the source of the yytext() string */
private char yy_buffer[] = new char[16384];
/** the text position at the last accepting state */
private int yy_markedPos;
/** the current text position in the buffer */
private int yy_currentPos;
/** startRead marks the beginning of the yytext() string in the buffer */
private int yy_startRead;
/** endRead marks the last character in the buffer, that has been read
from input */
private int yy_endRead;
/** number of newlines encountered up to the start of the matched text
(the field itself is commented out in this scanner) */
// private int yyline;
/** the number of characters up to the start of the matched text */
private int yychar;
/**
* the number of characters from the last newline up to the start of the
* matched text (the field itself is commented out in this scanner)
*/
// private int yycolumn;
/**
* yy_atBOL == true <=> the scanner is currently at the beginning of a line
* (the field itself is commented out in this scanner)
*/
// private boolean yy_atBOL;
/** yy_atEOF == true <=> the scanner has returned a value for EOF */
private boolean yy_atEOF;
/** denotes if the user-EOF-code has already been executed */
private boolean yy_eof_done;
/* user code: */
// running count maintained by getNextToken(); set back to 0 by reset(...)
private int fTokenCount = 0;
// required holders for white-space compacting: getNextToken() scans one
// token ahead and parks its context/start/length in the fBuffered* fields;
// fShouldLoadBuffered tells the next call to use the parked token instead of
// scanning a fresh one
private boolean fShouldLoadBuffered = false;
private String fBufferedContext = null;
private int fBufferedStart = 1;
private int fBufferedLength = 0;
// context of the look-ahead token most recently scanned by getNextToken()
private String f_context = null;
// state stack for handling embedded regions
private IntStack fStateStack = new IntStack();
// values of the token currently being assembled by getNextToken():
// textLength is the token's own length, length additionally includes a
// directly following WHITE_SPACE token
private String context = null;
private int start = 0;
private int textLength = 0;
private int length = 0;
// offset for tracking position specific block tags; added to yychar by getOffset()
private int fOffset = 0;
// the name of the current tag being opened; null when the last tag name
// seen is not one of the registered block marker names
private String fCurrentTagName = null;
// the list of tag name BlockMarkers
private List fBlockMarkers = new ArrayList();
// required to not seek text blocks on an end tag: switched on at
// XML_TAG_OPEN, switched off at XML_END_TAG_OPEN and whenever doScan(...) runs
private boolean fIsBlockingEnabled = false;
// whether doScan(...) compares characters exactly (true) or after lower-casing (false)
private boolean fIsCaseSensitiveBlocking = true;
// factory used by getNextToken() to turn a context and offsets into an ITextRegion
private XMLParserRegionFactory fRegionFactory = new XMLParserRegionFactory();
/**
 * user method
 *
 * Registers a block marker, unless containsTagName(...) reports that the
 * marker's tag name is already covered by a registered marker.
 *
 * @param marker the marker to register
 */
public final void addBlockMarker(BlockMarker marker) {
    boolean alreadyKnown = containsTagName(marker.getTagName());
    if (!alreadyKnown) {
        fBlockMarkers.add(marker);
    }
}
/**
 * user method
 *
 * Drops the given marker from the list of registered block markers.
 *
 * @param marker the marker to unregister
 */
public final void removeBlockMarker(BlockMarker marker) {
    this.fBlockMarkers.remove(marker);
}
/**
 * user method
 *
 * Unregisters every block marker whose tag name is exactly equal
 * (case-sensitively) to the given name.
 *
 * @param tagname the tag name whose markers should be removed
 */
public final void removeBlockMarker(String tagname) {
    if (fBlockMarkers == null) {
        return;
    }
    for (Iterator it = fBlockMarkers.iterator(); it.hasNext();) {
        BlockMarker candidate = (BlockMarker) it.next();
        if (candidate.getTagName().equals(tagname)) {
            // remove through the iterator so the traversal stays valid
            it.remove();
        }
    }
}
/**
 * user method
 *
 * @return the current case-sensitivity flag used when scanning for the end
 *         of a block
 */
public final boolean isCaseSensitiveBlocking() {
    return this.fIsCaseSensitiveBlocking;
}
/**
 * user method
 *
 * @param newValue true to compare block end text exactly, false to compare
 *        it ignoring case
 */
public final void setCaseSensitiveBlocking(boolean newValue) {
    this.fIsCaseSensitiveBlocking = newValue;
}
/**
 * user method
 *
 * @return the case sensitivity registered for the current tag name
 * @see #getBlockMarkerCaseSensitivity(String)
 */
public boolean getBlockMarkerCaseSensitivity() {
    String currentName = fCurrentTagName;
    return getBlockMarkerCaseSensitivity(currentName);
}
/**
 * user method
 *
 * Looks up the first registered block marker matching the given tag name
 * (matched exactly for case-sensitive markers, ignoring case otherwise) and
 * reports that marker's case sensitivity.
 *
 * @param name the tag name to look up
 * @return the matching marker's case sensitivity, or true when no marker
 *         matches
 */
public boolean getBlockMarkerCaseSensitivity(String name) {
    for (Iterator it = fBlockMarkers.iterator(); it.hasNext();) {
        BlockMarker candidate = (BlockMarker) it.next();
        if (candidate.isCaseSensitive()) {
            if (candidate.getTagName().equals(name)) {
                return true;
            }
        }
        else if (candidate.getTagName().equalsIgnoreCase(name)) {
            return false;
        }
    }
    return true;
}
/**
 * user method
 *
 * @return the block context registered for the current tag name
 * @see #getBlockMarkerContext(String)
 */
public String getBlockMarkerContext() {
    String currentName = fCurrentTagName;
    return getBlockMarkerContext(currentName);
}
/**
 * user method
 *
 * Returns the context of the first registered block marker that matches
 * the given tag name. A marker's own case sensitivity decides how its tag
 * name is compared (exactly, or ignoring case), which keeps this lookup in
 * step with getBlockMarkerCaseSensitivity(String); otherwise a
 * case-insensitive marker such as "script" would lose its context for a tag
 * written as "SCRIPT".
 *
 * @param name the tag name to look up; may be null, which matches nothing
 * @return the matching marker's context, or BLOCK_TEXT when no marker
 *         matches
 */
public String getBlockMarkerContext(String name) {
    Iterator iterator = fBlockMarkers.iterator();
    while (iterator.hasNext()) {
        BlockMarker marker = (BlockMarker) iterator.next();
        String markerName = marker.getTagName();
        boolean matches;
        if (marker.isCaseSensitive()) {
            matches = markerName.equals(name);
        }
        else {
            matches = markerName.equalsIgnoreCase(name);
        }
        if (matches) {
            return marker.getContext();
        }
    }
    return BLOCK_TEXT;
}
/**
 * user method
 *
 * @return the tokenizer's own list of registered block markers (the list
 *         itself, not a copy)
 */
public List getBlockMarkers() {
    return this.fBlockMarkers;
}
/**
 * user method
 *
 * @return the offset given to reset(...) plus the number of characters up
 *         to the start of the matched text
 */
public final int getOffset() {
    int scannedChars = yychar;
    return fOffset + scannedChars;
}
/**
 * @return whether the current tag name is a block marker
 * @see #isBlockMarker(String)
 */
private final boolean isBlockMarker() {
    String currentName = fCurrentTagName;
    return isBlockMarker(currentName);
}
/**
 * @param tagName the tag name to test
 * @return true only while blocking is enabled and containsTagName(...)
 *         accepts the name
 */
private final boolean isBlockMarker(String tagName) {
    // the name is only looked up when blocking is enabled
    return fIsBlockingEnabled && containsTagName(tagName);
}
/**
 * user method
 *
 * Shorthand for beginBlockMarkerScan(newTagName, BLOCK_TEXT).
 *
 * @param newTagName the tag name whose block text is about to be scanned
 */
public final void beginBlockTagScan(String newTagName) {
    final String blockContext = BLOCK_TEXT;
    beginBlockMarkerScan(newTagName, blockContext);
}
/**
 * user method
 *
 * Special tokenizer setup. Switches the scanner into ST_BLOCK_TAG_SCAN and
 * records "newTagName" as the current tag name, so that tokenization can be
 * initiated at the start of a text block within a "newTagName" tag.
 *
 * Example:
 * Tokenizer toker = new Tokenizer();
 * toker.setCaseSensitiveBlocking(false);
 * toker.reset(new java.io.StringReader("afiuhqwkejhtasihgalkwhtq</scripter></scr></script>asgdasga"));
 * toker.beginBlockMarkerScan("script", BLOCK_TEXT);
 * toker.getRegions();
 *
 * Returns:
 * BLOCK_TEXT: 0-40
 * XML_END_TAG_OPEN: 41-42
 * XML_TAG_NAME: 43-48
 * XML_TAG_CLOSE: 49-49
 * XML_CONTENT: 50-57
 *
 * @param newTagName the tag name whose end tag terminates the block
 * @param blockcontext not read by this implementation
 */
public final void beginBlockMarkerScan(String newTagName, String blockcontext) {
    yybegin(ST_BLOCK_TAG_SCAN);
    this.fCurrentTagName = newTagName;
}
/**
* Method doScan.
*
* Advances through the input looking for searchString and marks the text from
* the current position up to the end of input, or to right *before* the first
* occurrence of searchString, as the matched region. Block seeking is switched
* off (fIsBlockingEnabled = false) as soon as the scan starts.
*
* @param searchString - target string to search for ex.: "-->", "</tagname"
* @param requireTailSeparator - whether the target must be immediately followed by whitespace or '>'
* @param searchContext - the context returned for the scanned region if it is of non-zero length
* @param exitState - the state entered once the scan is over, unless the searchString was found immediately
* @param immediateFallbackState - the state entered if the searchString was found immediately
* @return String - searchContext when the marked region is of non-zero length; otherwise
* whatever primGetNextToken() returns after the state change
* @throws IOException
*/
private final String doScan(String searchString, boolean requireTailSeparator, String searchContext, int exitState, int immediateFallbackState) throws IOException {
boolean stillSearching = true;
// Disable further block (probably)
fIsBlockingEnabled = false;
int searchStringLength = searchString.length();
int n = 0;
char lastCheckChar;
int i;
boolean same = false;
while (stillSearching) {
n = 0;
// Ensure that enough data from the input exists to compare against the search String.
n = yy_advance();
while(n != YYEOF && yy_currentPos < searchStringLength)
n = yy_advance();
// If the input was too short or we've exhausted the input, stop immediately.
if (n == YYEOF) {
stillSearching = false;
}
else {
same = true;
// Ensure that we've not encountered a complete block (<%%>) that was *shorter* than the closeTagString and
// thus found twice at current-targetLength [since the first scan would have come out this far anyway].
// Check the characters in the target versus the last targetLength characters read from the buffer
// and see if it matches
// safety check for array accesses (yy_currentPos is the *last* character we can check against)
if(yy_currentPos >= searchStringLength && yy_currentPos <= yy_buffer.length) {
// compare the searchStringLength characters that end just before yy_currentPos,
// exactly or lower-cased depending on fIsCaseSensitiveBlocking
for(i = 0; i < searchStringLength; i++) {
if(same && fIsCaseSensitiveBlocking)
same = yy_buffer[i + yy_currentPos - searchStringLength] == searchString.charAt(i);
else if(same && !fIsCaseSensitiveBlocking)
same = Character.toLowerCase(yy_buffer[i + yy_currentPos - searchStringLength]) == Character.toLowerCase(searchString.charAt(i));
}
}
// safety check failed; no match is possible right now
else {
same = false;
}
if (same && requireTailSeparator && yy_currentPos < yy_buffer.length) {
// Additional check for close tags to ensure that targetString="</script" doesn't match
// "</scriptS"
lastCheckChar = yy_buffer[yy_currentPos];
// Succeed on "</script>" and "</script "
if(lastCheckChar == '>' || Character.isWhitespace(lastCheckChar))
stillSearching = false;
}
else {
// keep going on a mismatch, or while fewer than searchStringLength
// characters lie between yy_startRead and yy_currentPos
stillSearching = !same || (yy_currentPos < yy_startRead + searchStringLength);
}
}
}
if (n != YYEOF || same) {
// We've stopped short of the end or definitely found a match
// mark the end of the region right before the searchString
yy_markedPos = yy_currentPos - searchStringLength;
yy_currentPos = yy_markedPos + 1;
// If the searchString occurs at the very beginning of what would have
// been a Block, resume scanning normally immediately
if (yy_markedPos == yy_startRead) {
yybegin(immediateFallbackState);
return primGetNextToken();
}
}
else {
// We ran through the rest of the input
yy_markedPos = yy_currentPos;
yy_currentPos++;
}
yybegin(exitState);
// If the ending occurs at the very beginning of what would have
// been a Block, resume scanning normally immediately
if(yy_markedPos == yy_startRead)
return primGetNextToken();
return searchContext;
}
/**
 * user method
 *
 * A generic lookahead-like operation: scans for target without requiring a
 * tail separator, using the same state both as exit state and as immediate
 * fallback state.
 *
 * @param target the text that ends the block
 * @param targetContext the context to report for the scanned text
 * @param immediateFallbackState the state to continue in after the scan
 * @return the context produced by doScan(...)
 * @throws IOException
 */
private final String doBlockScan(String target, String targetContext, int immediateFallbackState) throws IOException {
    final boolean requireTailSeparator = false;
    final int exitState = immediateFallbackState;
    return doScan(target, requireTailSeparator, targetContext, exitState, immediateFallbackState);
}
/**
 * user method
 *
 * Does a lookahead for the end tag of the current tag name: adopts the case
 * sensitivity registered for that tag, then scans for "&lt;/" + tag name
 * followed by whitespace or '>', continuing in YYINITIAL afterwards.
 *
 * @return the context produced by doScan(...)
 * @throws IOException
 */
private final String doBlockTagScan() throws IOException {
    fIsCaseSensitiveBlocking = getBlockMarkerCaseSensitivity();
    String endTagStart = "</" + fCurrentTagName;
    String blockContext = getBlockMarkerContext(fCurrentTagName);
    return doScan(endTagStart, true, blockContext, YYINITIAL, YYINITIAL);
}
/**
 * user method
 *
 * Wraps the raw context String produced by primGetNextToken() into a full
 * ITextRegion, filling in the offsets of the scanned text.
 *
 * Each call also scans one token ahead. A WHITE_SPACE look-ahead token is
 * folded into the returned region (it extends the region's length but not
 * its text length); any other look-ahead token is parked and becomes the
 * starting token of the next call.
 *
 * @return the next region, or null when EOF is encountered
 * @throws IOException
 */
public final ITextRegion getNextToken() throws IOException {
    if (fShouldLoadBuffered) {
        // start from the token parked by the previous call
        // (assumed to be a non-whitespace token)
        context = fBufferedContext;
        start = fBufferedStart;
        length = fBufferedLength;
        textLength = length;
        fShouldLoadBuffered = false;
    }
    else {
        context = primGetNextToken();
        trackBlockTagState(context);
        start = yychar;
        length = yylength();
        textLength = length;
        if (yy_atEOF) {
            fTokenCount++;
            return null;
        }
    }

    // scan and remember the token that follows
    f_context = primGetNextToken();
    trackBlockTagState(f_context);
    fBufferedContext = f_context;
    fBufferedStart = yychar;
    fBufferedLength = yylength();
    if (fBufferedContext == WHITE_SPACE) {
        // absorb the whitespace into the current region instead of parking it
        fShouldLoadBuffered = false;
        length += fBufferedLength;
    }
    else {
        fShouldLoadBuffered = true;
    }

    if (context == null) {
        // EOF
        if (Debug.debugTokenizer) {
            System.out.println(getClass().getName() + " discovered " + fTokenCount + " tokens."); //$NON-NLS-2$//$NON-NLS-1$
        }
        return null;
    }
    fTokenCount++;
    return fRegionFactory.createToken(context, start, textLength, length, null, fCurrentTagName);
}

/**
 * Updates the block-tag bookkeeping for a freshly scanned token: a tag name
 * is remembered only if it is a registered block marker name, a tag open
 * enables block seeking and an end tag open disables it. Contexts are
 * compared by identity, exactly as the scanner hands them out.
 */
private void trackBlockTagState(String tokenContext) {
    if (tokenContext == XML_TAG_NAME) {
        boolean isMarkerName = containsTagName(yy_buffer, yy_startRead, yy_markedPos - yy_startRead);
        fCurrentTagName = isMarkerName ? yytext() : null;
    }
    else if (tokenContext == XML_TAG_OPEN) {
        fIsBlockingEnabled = true;
    }
    else if (tokenContext == XML_END_TAG_OPEN) {
        fIsBlockingEnabled = false;
    }
}
/* user method */
public HTMLTokenizer(){
super();
}
/**
 * user method
 *
 * Creates a tokenizer over the given characters by wrapping them in a
 * CharArrayReader and delegating to the Reader-based constructor.
 *
 * @param charArray the characters to tokenize
 */
public HTMLTokenizer(char[] charArray){
this(new CharArrayReader(charArray));
}
/**
 * user method
 *
 * Resets the tokenizer to read the given characters, with offset 0.
 *
 * @param charArray the characters to tokenize
 */
public void reset(char[] charArray) {
    java.io.Reader source = new CharArrayReader(charArray);
    reset(source, 0);
}
/**
 * user method
 *
 * Resets the tokenizer to read the given characters.
 *
 * @param charArray the characters to tokenize
 * @param newOffset the offset that getOffset() adds to scanner positions
 */
public void reset(char[] charArray, int newOffset) {
    java.io.Reader source = new CharArrayReader(charArray);
    reset(source, newOffset);
}
/**
 * user method
 *
 * Resets the tokenizer to read the given stream, with offset 0. The bytes
 * are decoded by a plain InputStreamReader, i.e. with the platform's
 * default charset.
 *
 * @param in the stream to tokenize
 */
public void reset(java.io.InputStream in) {
    java.io.Reader decoded = new java.io.InputStreamReader(in);
    reset(decoded, 0);
}
/**
 * user method
 *
 * Resets the tokenizer to read the given stream. The bytes are decoded by a
 * plain InputStreamReader, i.e. with the platform's default charset.
 *
 * @param in the stream to tokenize
 * @param newOffset the offset that getOffset() adds to scanner positions
 */
public void reset(java.io.InputStream in, int newOffset) {
    java.io.Reader decoded = new java.io.InputStreamReader(in);
    reset(decoded, newOffset);
}
/**
 * user method
 *
 * Resets the tokenizer to read from the given reader, with offset 0.
 *
 * @param in the reader to tokenize
 */
public void reset(java.io.Reader in) {
    final int noOffset = 0;
    reset(in, noOffset);
}
/**
 * user method *
 *
 * Puts the scanner's counters and variables back to their "newly created"
 * values and attaches a new input, in the hopes that resetting a
 * pre-existing tokenizer is faster than creating a new one.
 *
 * This method contains code blocks that were essentially duplicated from the
 * <em>generated</em> output of this specification before this method was
 * added. Those code blocks were under the above copyright.
 *
 * @param in the reader to tokenize
 * @param newOffset the offset that getOffset() adds to scanner positions
 */
public void reset(java.io.Reader in, int newOffset) {
    if (Debug.debugTokenizer) {
        System.out.println("resetting tokenizer");//$NON-NLS-1$
    }

    /* generated scanner state */
    // input device, DFA state and lexical state
    yy_reader = in;
    yy_state = 0;
    yy_lexical_state = YYINITIAL;
    // wipe the buffer holding the text to be matched (source of yytext())
    java.util.Arrays.fill(yy_buffer, (char)0);
    // last accepting position, current position, start of yytext() and
    // end of the data read so far all go back to the start of the buffer
    yy_markedPos = 0;
    yy_currentPos = 0;
    yy_startRead = 0;
    yy_endRead = 0;
    // number of characters up to the start of the matched text
    // (yyline is not tracked by this scanner)
    yychar = 0;
    // no EOF value returned yet, user-EOF-code not yet executed
    yy_atEOF = false;
    yy_eof_done = false;

    /* user vars: */
    fOffset = newOffset;
    fTokenCount = 0;
    fShouldLoadBuffered = false;
    fBufferedContext = null;
    fBufferedStart = 1;
    fBufferedLength = 0;
    fStateStack = new IntStack();
    context = null;
    start = 0;
    textLength = 0;
    length = 0;
}
/**
 * user method
 *
 * Creates a fresh tokenizer and registers on it every block marker of this
 * tokenizer that reports itself as global.
 *
 * @return the new tokenizer
 */
public BlockTokenizer newInstance() {
    final HTMLTokenizer copy = new HTMLTokenizer();
    // global tagmarkers can be shared; they have no state and
    // are never destroyed (e.g. 'release')
    for (int index = 0; index < fBlockMarkers.size(); index++) {
        final BlockMarker candidate = (BlockMarker) fBlockMarkers.get(index);
        if (!candidate.isGlobal()) {
            continue;
        }
        copy.addBlockMarker(candidate);
    }
    return copy;
}
/**
 * user method
 *
 * Delegates to doScan to look for the comment terminator '-->'. Per the
 * original note on this method: the text up to the terminator is reported
 * as XML_COMMENT_TEXT, unless the terminator occurs IMMEDIATELY, in which
 * case the scanner changes to ST_XML_COMMENT_END and the next context is
 * returned as usual.
 *
 * @return the context produced by doScan
 * @exception IOException if any I/O-Error occurs
 */
private final String scanXMLCommentText() throws IOException {
    final String scannedContext =
            doScan("-->", false, XML_COMMENT_TEXT, ST_XML_COMMENT_END, ST_XML_COMMENT_END);
    return scannedContext;
}
/**
 * Creates a new scanner that reads from the given reader.
 * A java.io.InputStream variant of this constructor also exists.
 *
 * @param in the java.io.Reader to read input from.
 */
public HTMLTokenizer(java.io.Reader in) {
    yy_reader = in;
}
/**
* Creates a new scanner that reads from the given stream.
* The stream is wrapped in a java.io.InputStreamReader constructed without
* an explicit charset, and the java.io.Reader version of this constructor
* is then used.
*
* @param in the java.io.InputStream to read input from.
*/
public HTMLTokenizer(java.io.InputStream in) {
this(new java.io.InputStreamReader(in));
}
/**
 * Expands the run-length encoded DFA transition table.
 *
 * The packed string is consumed as (count, value) character pairs: each
 * value, decremented by one, is written count times (at least once) into
 * the result.
 *
 * @param packed the packed transition table
 * @return the unpacked transition table
 */
private static int [] yy_unpack(String packed) {
    final int[] table = new int[10175];
    int out = 0; /* next free slot in the unpacked table */
    for (int in = 0; in < 3126; in += 2) {
        int run = packed.charAt(in);
        final int target = packed.charAt(in + 1) - 1;
        do {
            table[out++] = target;
        } while (--run > 0);
    }
    return table;
}
/**
 * Expands the run-length encoded character translation table.
 *
 * The packed string is consumed as (count, value) character pairs: each
 * value is written count times (at least once) into the result.
 *
 * @param packed the packed character translation table
 * @return the unpacked character translation table
 */
private static char [] yy_unpack_cmap(String packed) {
    final char[] table = new char[0x10000];
    int out = 0; /* next free slot in the unpacked table */
    for (int in = 0; in < 1372; in += 2) {
        int run = packed.charAt(in);
        final char mapped = packed.charAt(in + 1);
        do {
            table[out++] = mapped;
        } while (--run > 0);
    }
    return table;
}
/**
* Gets the next input character.
*
* Characters are served from yy_buffer while unread ones remain. Otherwise
* the buffer is compacted (the text from yy_startRead onwards is moved to
* index 0), enlarged if the current position has reached its end, and
* refilled from yy_reader.
*
* @return the next character of the input stream, EOF if the
* end of the stream is reached.
* @exception IOException if any I/O-Error occurs
*/
private int yy_advance() throws java.io.IOException {
/* standard case */
if (yy_currentPos < yy_endRead) return yy_buffer[yy_currentPos++];
/* if the eof is reached, we don't need to work hard */
if (yy_atEOF) return YYEOF;
/* otherwise: need to refill the buffer */
/* first: make room (if you can) */
if (yy_startRead > 0) {
// slide the still-needed text (current match onwards) to the buffer start
System.arraycopy(yy_buffer, yy_startRead,
yy_buffer, 0,
yy_endRead-yy_startRead);
/* translate stored positions */
yy_endRead-= yy_startRead;
yy_currentPos-= yy_startRead;
yy_markedPos-= yy_startRead;
yy_startRead = 0;
}
/* is the buffer big enough? */
if (yy_currentPos >= yy_buffer.length) {
/* if not: blow it up */
// the new capacity is twice the current position; existing content is kept
char newBuffer[] = new char[yy_currentPos*2];
System.arraycopy(yy_buffer, 0, newBuffer, 0, yy_buffer.length);
yy_buffer = newBuffer;
}
/* finally: fill the buffer with new input */
int numRead = yy_reader.read(yy_buffer, yy_endRead,
yy_buffer.length-yy_endRead);
// end of stream: report EOF; yy_atEOF itself is not modified here
if ( numRead == -1 ) return YYEOF;
yy_endRead+= numRead;
return yy_buffer[yy_currentPos++];
}
/**
 * Closes the input reader after marking the scanner as being at end of
 * file and discarding any buffered, not yet consumed input.
 *
 * @exception java.io.IOException if closing the reader fails
 */
final public void yyclose() throws java.io.IOException {
    // invalidate whatever is still buffered and flag end of file
    yy_endRead = yy_startRead;
    yy_atEOF = true;
    yy_reader.close();
}
/**
 * Reports the lexical state the scanner is currently in.
 *
 * @return the current lexical state
 */
final public int yystate() {
    return this.yy_lexical_state;
}
/**
 * Switches the scanner to another lexical state.
 *
 * @param newState the lexical state to enter
 */
final public void yybegin(int newState) {
    this.yy_lexical_state = newState;
}
/**
 * Returns the text matched by the current regular expression, i.e. the
 * buffer content between the start of the match and the marked position.
 *
 * @return a new String holding the matched text
 */
final public String yytext() {
    final int matchedLength = yy_markedPos - yy_startRead;
    return new String(yy_buffer, yy_startRead, matchedLength);
}
/**
 * Returns the length of the matched text region, i.e. the distance from
 * the start of the match to the marked position.
 *
 * @return the number of matched characters
 */
final public int yylength() {
    final int matchStart = yy_startRead;
    return yy_markedPos - matchStart;
}
/**
 * Reports an error that occurred while scanning - from the SED JFlex skeleton.
 *
 * The message registered for the given code is written to the log; a code
 * outside the range of YY_ERROR_MSG is reported with the message for
 * YY_UNKNOWN_ERROR. The error is only logged: no exception is thrown and
 * the VM is never exited, so callers continue after this method returns.
 *
 * @param errorCode the code of the error message to log
 */
private void yy_ScanError(int errorCode) {
    // select the message with an explicit range check instead of relying on
    // an ArrayIndexOutOfBoundsException for control flow
    final boolean knownCode = errorCode >= 0 && errorCode < YY_ERROR_MSG.length;
    Logger.log(Logger.ERROR, YY_ERROR_MSG[knownCode ? errorCode : YY_UNKNOWN_ERROR]);
    // DO NOT EXIT the VM on an error
}
/**
 * Pushes the specified number of characters back into the input stream.
 *
 * They will be read again by the next call of the scanning method.
 *
 * If more characters are requested than the current match contains, the
 * error is reported and nothing is pushed back. yy_ScanError only logs in
 * this skeleton, so without this guard the marked position would move in
 * front of the start of the match and yylength() would become negative.
 *
 * @param number the number of characters to be read again.
 * This number must not be greater than yylength()!
 */
void yypushback(int number) {
    if ( number > yylength() ) {
        yy_ScanError(YY_PUSHBACK_2BIG);
        // leave the match untouched rather than corrupting the positions
        return;
    }
    yy_markedPos -= number;
}
/**
 * user method - skeleton.sed
 *
 * Checks whether the characters markerTagName[offset .. offset+tagnameLength-1]
 * spell the tag name of any registered block marker. Each marker is compared
 * exactly or with both sides lower-cased, depending on whether the marker
 * reports itself as case sensitive.
 *
 * @param markerTagName the character array holding the candidate name
 * @param offset index of the first character of the candidate name
 * @param tagnameLength number of characters in the candidate name
 * @return true if some block marker's tag name matches
 */
protected final boolean containsTagName(char[] markerTagName, int offset, int tagnameLength) {
    for (int m = 0; m < fBlockMarkers.size(); m++) {
        final BlockMarker candidate = (BlockMarker) fBlockMarkers.get(m);
        // names of different length can never match
        if (candidate.getTagName().length() != tagnameLength) {
            continue;
        }
        int pos = 0;
        while (pos < tagnameLength) {
            final boolean exact = candidate.isCaseSensitive();
            final char expected = candidate.getTagName().charAt(pos);
            final char actual = markerTagName[pos + offset];
            final boolean same = exact
                    ? expected == actual
                    : Character.toLowerCase(expected) == Character.toLowerCase(actual);
            if (!same) {
                break;
            }
            pos++;
        }
        // the loop ran to completion only if every character matched
        if (pos >= tagnameLength) {
            return true;
        }
    }
    return false;
}
/**
 * user method - skeleton.sed
 *
 * Collects every region that getNextToken() yields until it returns null.
 * Note: for verification use
 *
 * A StackOverflowError is logged and rethrown; any other Exception is
 * logged and the regions gathered so far are returned.
 *
 * @return the list of regions collected
 */
public final List getRegions() {
    final List collected = new ArrayList();
    try {
        for (ITextRegion next = getNextToken(); next != null; next = getNextToken()) {
            collected.add(next);
        }
    }
    catch (StackOverflowError overflow) {
        Logger.logException(getClass().getName()+": input could not be tokenized correctly at position " + getOffset(), overflow);//$NON-NLS-1$
        throw overflow;
    }
    catch (Exception failure) {
        // Since this is convenience method and NOT the recommended
        // way of getting tokens, many errors are simply hidden
        Logger.logException("Exception not handled retrieving regions: " + failure.getLocalizedMessage(), failure);//$NON-NLS-1$
    }
    return collected;
}
/**
 * user method - skeleton.sed
 *
 * When tokenizer debugging is enabled, prints the given label followed by
 * the character range and the escaped text of the current match.
 *
 * @param s the label to print in front of the match details
 */
private final void dump(String s) {
    if (!Debug.debugTokenizer) {
        return;
    }
    final int matchEnd = yylength() + yychar;
    final String range = " (" + yychar + "-" + matchEnd; //$NON-NLS-2$//$NON-NLS-1$
    final String quoted = "):\'" + StringUtils.escape(yytext()) + "\'"; //$NON-NLS-2$//$NON-NLS-1$
    System.out.println(s + range + quoted);
}
/**
 * user method - skeleton.sed
 *
 * @return the current value of the scanner's end-of-file flag
 */
public final boolean isEOF() {
    return this.yy_atEOF;
}
/**
 * user method - skeleton.sed
 *
 * Checks whether any registered block marker has the given tag name. Each
 * marker is compared with equals or equalsIgnoreCase, depending on whether
 * the marker reports itself as case sensitive.
 *
 * @param markerTagName the tag name to look for
 * @return true if some block marker's tag name matches
 */
protected final boolean containsTagName(String markerTagName) {
    for (Iterator remaining = fBlockMarkers.iterator(); remaining.hasNext();) {
        final BlockMarker candidate = (BlockMarker) remaining.next();
        final boolean matches = candidate.isCaseSensitive()
                ? candidate.getTagName().equals(markerTagName)
                : candidate.getTagName().equalsIgnoreCase(markerTagName);
        if (matches) {
            return true;
        }
    }
    return false;
}
/**
 * Hook for user EOF code, guarded so that it takes effect exactly once,
 * when the end of file is reached. Apart from recording that it has run,
 * it does nothing.
 */
private void yy_do_eof() {
    if (yy_eof_done) {
        return;
    }
    yy_eof_done = true;
    // do nothing, this is the downstream parser's job
}
/**
* Resumes scanning until the next regular expression is matched,
* the end of input is encountered or an I/O-Error occurs.
*
* Each pass of the outer loop starts a new match where the previous one
* ended, runs the DFA over the input to find the action to execute, and
* then executes that action in the switch below. Most actions optionally
* dump debug output, switch the lexical state with yybegin and return a
* region context; a few delegate to block scanning helpers (doScan,
* doBlockScan, doBlockTagScan).
*
* @return the context of the next token, or null once the end of input
* has been reached
* @exception IOException if any I/O-Error occurs
*/
public String primGetNextToken() throws java.io.IOException {
int yy_input;
int yy_action;
while (true) {
// account for the previous match, then begin the new match at its end
yychar+= yylength();
yy_action = -1;
yy_currentPos = yy_startRead = yy_markedPos;
yy_state = yy_lexical_state;
yy_forAction: {
while (true) {
yy_input = yy_advance();
if ( yy_input == YYEOF ) break yy_forAction;
// look up the transition for the current state and character class
int yy_next = yytrans[ yy_rowMap[yy_state] + yycmap[yy_input] ];
if (yy_next == -1) break yy_forAction;
yy_state = yy_next;
int yy_attributes = YY_ATTRIBUTE[yy_state];
// bit 0 set: remember this state as the latest action and mark the position
if ( (yy_attributes & 1) > 0 ) {
yy_action = yy_state;
yy_markedPos = yy_currentPos;
// bit 3 set: stop scanning right away
if ( (yy_attributes & 8) > 0 ) break yy_forAction;
}
}
}
// execute the action selected by the DFA run; the "case N: break;" labels
// between the actions are no-ops emitted by the generator
switch (yy_action) {
case 268:
{
if(Debug.debugTokenizer)
dump("XSL processing instruction target");//$NON-NLS-1$
yybegin(ST_XML_PI_ATTRIBUTE_NAME);
return XML_TAG_NAME;
}
case 270: break;
case 260:
case 262:
case 263:
{
if(Debug.debugTokenizer)
dump("\nCDATA start");//$NON-NLS-1$
// remember the state to return to when the CDATA section ends
fStateStack.push(yystate());
yybegin(ST_CDATA_TEXT);
return XML_CDATA_OPEN;
}
case 271: break;
case 253:
{
if(Debug.debugTokenizer)
dump("element");//$NON-NLS-1$
yybegin(ST_XML_ELEMENT_DECLARATION);
return XML_ELEMENT_DECLARATION;
}
case 272: break;
case 252:
{
if(Debug.debugTokenizer)
dump("attlist");//$NON-NLS-1$
yybegin(ST_XML_ATTLIST_DECLARATION);
return XML_ATTLIST_DECLARATION;
}
case 273: break;
case 251:
{
if(Debug.debugTokenizer)
dump("doctype");//$NON-NLS-1$
yybegin(ST_XML_DOCTYPE_DECLARATION);
return XML_DOCTYPE_DECLARATION;
}
case 274: break;
case 246:
{
if(Debug.debugTokenizer)
dump("doctype external id");//$NON-NLS-1$
yybegin(ST_XML_DOCTYPE_ID_PUBLIC);
return XML_DOCTYPE_EXTERNAL_ID_PUBLIC;
}
case 275: break;
case 245:
{
if(Debug.debugTokenizer)
dump("doctype external id");//$NON-NLS-1$
yybegin(ST_XML_DOCTYPE_ID_SYSTEM);
return XML_DOCTYPE_EXTERNAL_ID_SYSTEM;
}
case 276: break;
case 216:
{
if(Debug.debugTokenizer)
dump("\nCharRef");//$NON-NLS-1$
return XML_CHAR_REFERENCE;
}
case 277: break;
case 212:
{
if(Debug.debugTokenizer)
dump("\ncomment start");//$NON-NLS-1$
yybegin(ST_XML_COMMENT);
return XML_COMMENT_OPEN;
}
case 278: break;
case 194:
case 195:
{
if(Debug.debugTokenizer)
dump("XML processing instruction target");//$NON-NLS-1$
yybegin(ST_XML_PI_ATTRIBUTE_NAME);
return XML_TAG_NAME;
}
case 279: break;
case 193:
{
if(Debug.debugTokenizer)
dump("comment end");//$NON-NLS-1$
yybegin(YYINITIAL);
return XML_COMMENT_CLOSE;
}
case 280: break;
case 192:
{
if(Debug.debugTokenizer)
dump("CDATA end");//$NON-NLS-1$
// return to the state that was active before the CDATA section
yybegin(fStateStack.pop());
return XML_CDATA_CLOSE;
}
case 281: break;
case 191:
{
if(Debug.debugTokenizer)
dump("\nPEReference");//$NON-NLS-1$
return XML_PE_REFERENCE;
}
case 282: break;
case 188:
{
if(Debug.debugTokenizer)
dump("\nEntityRef");//$NON-NLS-1$
return XML_ENTITY_REFERENCE;
}
case 283: break;
case 139:
case 144:
case 156:
{
return XML_DOCTYPE_INTERNAL_SUBSET;
}
case 284: break;
case 127:
{
yybegin(YYINITIAL);
if(Debug.debugTokenizer)
dump("empty tag close");//$NON-NLS-1$
return XML_EMPTY_TAG_CLOSE;
}
case 285: break;
case 120:
{
if(Debug.debugTokenizer)
dump("XML processing instruction end");//$NON-NLS-1$
yybegin(YYINITIAL);
return XML_PI_CLOSE;
}
case 286: break;
case 119:
{
// ended with nothing inside
yybegin(YYINITIAL);
return XML_PI_CLOSE;
}
case 287: break;
case 52:
case 54:
case 55:
case 56:
case 124:
{
if(Debug.debugTokenizer)
dump("XML processing instruction attribute value");//$NON-NLS-1$
yybegin(ST_XML_PI_ATTRIBUTE_NAME);
return XML_TAG_ATTRIBUTE_VALUE;
}
case 288: break;
case 51:
{
if(Debug.debugTokenizer)
dump("XML processing instruction '='");//$NON-NLS-1$
yybegin(ST_XML_PI_ATTRIBUTE_VALUE);
return XML_TAG_ATTRIBUTE_EQUALS;
}
case 289: break;
case 50:
{
if(Debug.debugTokenizer)
dump("XML processing instruction attribute name");//$NON-NLS-1$
yybegin(ST_XML_PI_EQUALS);
return XML_TAG_ATTRIBUTE_NAME;
}
case 290: break;
case 46:
case 47:
case 48:
{
// block scan until close is found
return doScan("?>", false, XML_PI_CONTENT, ST_XML_PI_TAG_CLOSE, ST_XML_PI_TAG_CLOSE);
}
case 291: break;
case 45:
{
yybegin(ST_PI_CONTENT);
return WHITE_SPACE;
}
case 292: break;
case 42:
case 43:
case 44:
case 117:
case 118:
case 218:
case 232:
case 241:
case 250:
case 257:
case 261:
case 264:
case 265:
case 266:
case 267:
{
if(Debug.debugTokenizer)
dump("processing instruction target");//$NON-NLS-1$
yybegin(ST_PI_WS);
return XML_TAG_NAME;
}
case 293: break;
case 37:
case 38:
{
if(Debug.debugTokenizer)
dump("comment content");//$NON-NLS-1$
return scanXMLCommentText();
}
case 294: break;
case 36:
{
if(Debug.debugTokenizer)
dump("LINE FEED");//$NON-NLS-1$
return WHITE_SPACE;
}
case 295: break;
case 31:
case 32:
{
if(Debug.debugTokenizer)
dump("CDATA text");//$NON-NLS-1$
String blockContext = doBlockScan("]]>", XML_CDATA_TEXT, ST_CDATA_END);//$NON-NLS-1$
// compared by reference, not with equals()
if(blockContext == XML_CDATA_TEXT)
yybegin(ST_CDATA_END);
return blockContext;
}
case 296: break;
case 0:
case 27:
case 109:
case 110:
case 111:
case 186:
case 187:
case 189:
case 190:
case 214:
case 215:
case 217:
case 230:
case 231:
{
if(Debug.debugTokenizer)
dump("\nXML content");//$NON-NLS-1$
return XML_CONTENT;
}
case 297: break;
case 5:
case 8:
case 9:
case 10:
case 13:
case 14:
case 15:
case 16:
case 17:
case 18:
case 19:
case 20:
case 21:
case 22:
case 24:
case 41:
{
if(Debug.debugTokenizer)
dump("white space");//$NON-NLS-1$
return WHITE_SPACE;
}
case 298: break;
case 12:
case 58:
{
if(Debug.debugTokenizer)
dump("inappropriate tag name");//$NON-NLS-1$
yybegin(YYINITIAL);
return XML_CONTENT;
}
case 299: break;
case 23:
case 93:
case 94:
case 172:
case 207:
case 226:
case 238:
case 247:
case 254:
case 258:
{
if(Debug.debugTokenizer)
dump("elementdecl contentspec");//$NON-NLS-1$
return XML_ELEMENT_DECL_CONTENT;
}
case 300: break;
case 25:
case 100:
case 101:
case 183:
case 211:
case 228:
case 239:
case 248:
case 255:
case 259:
{
if(Debug.debugTokenizer)
dump("attlist contentspec");//$NON-NLS-1$
return XML_ATTLIST_DECL_CONTENT;
}
case 301: break;
case 28:
case 59:
case 70:
{
if(Debug.debugTokenizer)
dump("\nstart tag open");//$NON-NLS-1$
yybegin(ST_XML_TAG_NAME);
return XML_TAG_OPEN;
}
case 302: break;
case 29:
case 33:
case 34:
case 35:
case 39:
case 40:
case 49:
case 53:
case 57:
case 61:
case 67:
case 72:
case 73:
case 74:
case 75:
case 77:
case 78:
case 80:
case 85:
case 90:
case 97:
{
if (Debug.debugTokenizer)
System.out.println("!!!unexpected!!!: \"" + yytext() + "\":" + //$NON-NLS-2$//$NON-NLS-1$
yychar + "-" + (yychar + yylength()));//$NON-NLS-1$
return UNDEFINED;
}
case 303: break;
case 30:
case 112:
{
if(Debug.debugTokenizer)
dump("non-reference %");//$NON-NLS-1$
return XML_CONTENT;
}
case 304: break;
case 60:
{
if(Debug.debugTokenizer)
dump("tag close");//$NON-NLS-1$
// after a block marker tag, continue with the block tag scan state
if(isBlockMarker()) {
yybegin(ST_BLOCK_TAG_SCAN);
}
else
yybegin(YYINITIAL);
return XML_TAG_CLOSE;
}
case 305: break;
case 62:
case 63:
{
if(Debug.debugTokenizer)
dump("tag name");//$NON-NLS-1$
yybegin(ST_XML_ATTRIBUTE_NAME);
return XML_TAG_NAME;
}
case 306: break;
case 64:
{
if(Debug.debugTokenizer)
dump("attr name");//$NON-NLS-1$
yybegin(ST_XML_EQUALS);
return XML_TAG_ATTRIBUTE_NAME;
}
case 307: break;
case 65:
{
if(Debug.debugTokenizer)
dump("equals");//$NON-NLS-1$
yybegin(ST_XML_ATTRIBUTE_VALUE);
return XML_TAG_ATTRIBUTE_EQUALS;
}
case 308: break;
case 66:
case 68:
case 69:
case 131:
{
if(Debug.debugTokenizer)
dump("attr value");//$NON-NLS-1$
yybegin(ST_XML_ATTRIBUTE_NAME);
return XML_TAG_ATTRIBUTE_VALUE;
}
case 309: break;
case 71:
{
if(Debug.debugTokenizer)
dump("declaration end");//$NON-NLS-1$
if (Debug.debugTokenizer) {
if(fStateStack.peek()!=YYINITIAL)
System.out.println("end embedded region");//$NON-NLS-1$
}
// return to the state that was pushed when the declaration started
yybegin(fStateStack.pop());
return XML_DECLARATION_CLOSE;
}
case 310: break;
case 76:
{
if(Debug.debugTokenizer)
dump("doctype type");//$NON-NLS-1$
yybegin(ST_XML_DOCTYPE_EXTERNAL_ID);
return XML_DOCTYPE_NAME;
}
case 311: break;
case 79:
case 81:
case 82:
case 83:
case 147:
case 148:
case 151:
case 152:
case 202:
{
if(Debug.debugTokenizer)
dump("doctype public reference");//$NON-NLS-1$
yybegin(ST_XML_DOCTYPE_ID_SYSTEM);
return XML_DOCTYPE_EXTERNAL_ID_PUBREF;
}
case 312: break;
case 84:
case 86:
case 87:
case 88:
case 159:
{
if(Debug.debugTokenizer)
dump("doctype system reference");//$NON-NLS-1$
yybegin(ST_XML_DECLARATION_CLOSE);
return XML_DOCTYPE_EXTERNAL_ID_SYSREF;
}
case 313: break;
case 89:
case 91:
case 92:
case 165:
case 166:
case 169:
case 170:
case 205:
{
if(Debug.debugTokenizer)
dump("elementdecl name");//$NON-NLS-1$
yybegin(ST_XML_ELEMENT_DECLARATION_CONTENT);
return XML_ELEMENT_DECL_NAME;
}
case 314: break;
case 95:
{
if(Debug.debugTokenizer)
dump("elementdecl close");//$NON-NLS-1$
if (Debug.debugTokenizer) {
if(fStateStack.peek()!=YYINITIAL)
System.out.println("end embedded region");//$NON-NLS-1$
}
yybegin(fStateStack.pop());
return XML_DECLARATION_CLOSE;
}
case 315: break;
case 96:
case 98:
case 99:
case 176:
case 177:
case 180:
case 181:
case 209:
{
if(Debug.debugTokenizer)
dump("attlist name");//$NON-NLS-1$
yybegin(ST_XML_ATTLIST_DECLARATION_CONTENT);
return XML_ATTLIST_DECL_NAME;
}
case 316: break;
case 102:
{
if(Debug.debugTokenizer)
dump("attlist close");//$NON-NLS-1$
if (Debug.debugTokenizer) {
if(fStateStack.peek()!=YYINITIAL)
System.out.println("end embedded region");//$NON-NLS-1$
}
yybegin(fStateStack.pop());
return XML_DECLARATION_CLOSE;
}
case 317: break;
case 105:
{
if(Debug.debugTokenizer)
dump("\nend tag open");//$NON-NLS-1$
yybegin(ST_XML_TAG_NAME);
return XML_END_TAG_OPEN;
}
case 318: break;
case 106:
{
if(Debug.debugTokenizer)
dump("\nprocessing instruction start");//$NON-NLS-1$
yybegin(ST_PI);
return XML_PI_OPEN;
}
case 319: break;
case 107:
{
// remember the state to return to when the declaration is closed
fStateStack.push(yystate());
if(Debug.debugTokenizer)
dump("\ndeclaration start");//$NON-NLS-1$
yybegin(ST_XML_DECLARATION);
return XML_DECLARATION_OPEN;
}
case 320: break;
case 116:
{
if(Debug.debugTokenizer)
dump("processing instruction end");//$NON-NLS-1$
yybegin(YYINITIAL);
return XML_PI_CLOSE;
}
case 321: break;
case 103:
case 104:
{
return doBlockTagScan();
}
case 322: break;
default:
// no action was selected: either the input is exhausted with nothing
// left to match, or the input could not be matched at all
if (yy_input == YYEOF && yy_startRead == yy_currentPos) {
yy_atEOF = true;
yy_do_eof();
return null;
}
else {
// NOTE(review): yy_ScanError only logs in this skeleton, so control
// returns to the top of the outer loop afterwards - confirm that a
// no-match without progress cannot occur in practice
yy_ScanError(YY_NO_MATCH);
}
}
}
}
}