/* The following code was generated by JFlex 1.2.2 on 8/6/16 1:32 PM */ /******************************************************************************* * Copyright (c) 2004, 2016 IBM Corporation and others. * All rights reserved. This program and the accompanying materials * are made available under the terms of the Eclipse Public License v1.0 * which accompanies this distribution, and is available at * http://www.eclipse.org/legal/epl-v10.html * * Contributors: * IBM Corporation - initial API and implementation *******************************************************************************/ package org.eclipse.wst.html.core.internal.parser; import java.io.CharArrayReader; import java.io.IOException; import java.util.ArrayList; import java.util.Iterator; import java.util.List; import org.eclipse.wst.html.core.internal.contenttype.IntStack; import org.eclipse.wst.sse.core.internal.ltk.parser.BlockMarker; import org.eclipse.wst.sse.core.internal.ltk.parser.BlockTokenizer; import org.eclipse.wst.sse.core.internal.provisional.text.ITextRegion; import org.eclipse.wst.sse.core.internal.util.Debug; import org.eclipse.wst.sse.core.utils.StringUtils; import org.eclipse.wst.xml.core.internal.Logger; import org.eclipse.wst.xml.core.internal.parser.regions.XMLParserRegionFactory; import org.eclipse.wst.xml.core.internal.regions.DOMRegionContext; /** * Generate with -skel skeleton.sse */ /** * This class is a scanner generated by * <a href="http://www.informatik.tu-muenchen.de/~kleing/jflex/">JFlex</a> 1.2.2 * on 8/6/16 1:32 PM from the specification file * <tt>file:/Users/nitin/git/webtools.sourceediting/bundles/org.eclipse.wst.sse.core/DevTimeSupport/SedModel/HTMLTokenizer/devel/HTMLTokenizer.jflex</tt> */ public class HTMLTokenizer implements BlockTokenizer, DOMRegionContext { /** this character denotes the end of file */ final public static int YYEOF = -1; /** lexical states */ final public static int ST_XML_DOCTYPE_EXTERNAL_ID = 19; final public static int ST_XML_ELEMENT_DECLARATION_CONTENT = 23; final public static int ST_XML_PI_TAG_CLOSE = 11; final public static int ST_XML_DECLARATION_CLOSE = 17; final public static int ST_XML_PI_ATTRIBUTE_VALUE = 10; final public static int ST_XML_TAG_NAME = 12; final public static int ST_XML_ATTRIBUTE_VALUE = 15; final public static int ST_XML_DOCTYPE_ID_SYSTEM = 21; final public static int ST_XML_ATTRIBUTE_NAME = 13; final public static int ST_XML_ELEMENT_DECLARATION = 22; final public static int ST_XML_DOCTYPE_DECLARATION = 18; final public static int ST_XML_ATTLIST_DECLARATION = 24; final public static int ST_XML_COMMENT_END = 4; final public static int ST_CDATA_TEXT = 1; final public static int ST_XML_COMMENT = 3; final public static int ST_PI_CONTENT = 7; final public static int ST_PI_WS = 6; final public static int ST_CDATA_END = 2; final public static int ST_XML_ATTLIST_DECLARATION_CONTENT = 25; final public static int ST_BLOCK_TAG_SCAN = 26; final public static int ST_XML_PI_EQUALS = 9; final public static int ST_XML_DECLARATION = 16; final public static int YYINITIAL = 0; final public static int ST_XML_DOCTYPE_ID_PUBLIC = 20; final public static int ST_XML_EQUALS = 14; final public static int ST_PI = 5; final public static int ST_XML_PI_ATTRIBUTE_NAME = 8; /** * Translates characters to character classes */ final private static String yycmap_packed = "\11\0\1\5\1\25\2\0\1\20\22\0\1\20\1\24\1\15\1\14"+ "\1\22\1\23\1\16\1\17\1\13\1\13\1\10\1\22\1\22\1\7"+ "\1\6\1\3\12\21\1\10\1\61\1\1\1\46\1\2\1\4\1\22"+ "\1\36\1\62\1\34\1\35\1\51\1\57\1\40\1\40\1\43\1\40"+ "\1\40\1\32\1\30\1\45\1\44\1\50\1\40\1\40\1\56\1\37"+ "\1\60\2\40\1\26\1\47\1\40\1\11\1\0\1\12\1\0\1\10"+ "\1\0\1\53\1\62\1\63\1\54\1\41\1\57\1\40\1\66\1\43"+ "\2\40\1\33\1\31\1\45\1\44\1\50\1\40\1\40\1\42\1\52"+ "\1\60\1\40\1\40\1\27\1\55\1\40\1\0\1\0\72\0\1\65"+ "\10\0\27\64\1\0\37\64\1\0\72\64\2\0\13\64\2\0\10\64"+ "\1\0\65\64\1\0\104\64\11\0\44\64\3\0\2\64\4\0\36\64"+ "\70\0\131\64\22\0\7\64\16\0\2\65\56\0\106\65\32\0\2\65"+ "\44\0\1\64\1\65\3\64\1\0\1\64\1\0\24\64\1\0\54\64"+ "\1\0\7\64\3\0\1\64\1\0\1\64\1\0\1\64\1\0\1\64"+ "\1\0\22\64\15\0\14\64\1\0\102\64\1\0\14\64\1\0\44\64"+ "\1\0\4\65\11\0\65\64\2\0\2\64\2\0\2\64\3\0\34\64"+ "\2\0\10\64\2\0\2\64\67\0\46\64\2\0\1\64\7\0\46\64"+ "\12\0\21\65\1\0\27\65\1\0\3\65\1\0\1\65\1\0\2\65"+ "\1\0\1\65\13\0\33\64\5\0\3\64\56\0\32\64\5\0\1\65"+ "\12\64\10\65\15\0\12\65\6\0\1\65\107\64\2\0\5\64\1\0"+ "\17\64\1\0\4\64\1\0\1\64\17\65\2\64\2\65\1\0\4\65"+ "\2\0\12\65\u0207\0\3\65\1\0\65\64\2\0\1\65\1\64\20\65"+ "\3\0\4\65\3\0\12\64\2\65\2\0\12\65\21\0\3\65\1\0"+ "\10\64\2\0\2\64\2\0\26\64\1\0\7\64\1\0\1\64\3\0"+ "\4\64\2\0\1\65\1\0\7\65\2\0\2\65\2\0\3\65\11\0"+ "\1\65\4\0\2\64\1\0\3\64\2\65\2\0\12\65\2\64\20\0"+ "\1\65\2\0\6\64\4\0\2\64\2\0\26\64\1\0\7\64\1\0"+ "\2\64\1\0\2\64\1\0\2\64\2\0\1\65\1\0\5\65\4\0"+ "\2\65\2\0\3\65\13\0\4\64\1\0\1\64\7\0\12\65\2\65"+ "\3\64\14\0\3\65\1\0\7\64\1\0\1\64\1\0\3\64\1\0"+ "\26\64\1\0\7\64\1\0\2\64\1\0\5\64\2\0\1\65\1\64"+ "\10\65\1\0\3\65\1\0\3\65\22\0\1\64\5\0\12\65\21\0"+ "\3\65\1\0\10\64\2\0\2\64\2\0\26\64\1\0\7\64\1\0"+ "\2\64\2\0\4\64\2\0\1\65\1\64\6\65\3\0\2\65\2\0"+ "\3\65\10\0\2\65\4\0\2\64\1\0\3\64\4\0\12\65\22\0"+ "\2\65\1\0\6\64\3\0\3\64\1\0\4\64\3\0\2\64\1\0"+ "\1\64\1\0\2\64\3\0\2\64\3\0\3\64\3\0\10\64\1\0"+ "\3\64\4\0\5\65\3\0\3\65\1\0\4\65\11\0\1\65\17\0"+ "\11\65\21\0\3\65\1\0\10\64\1\0\3\64\1\0\27\64\1\0"+ "\12\64\1\0\5\64\4\0\7\65\1\0\3\65\1\0\4\65\7\0"+ "\2\65\11\0\2\64\4\0\12\65\22\0\2\65\1\0\10\64\1\0"+ "\3\64\1\0\27\64\1\0\12\64\1\0\5\64\4\0\7\65\1\0"+ "\3\65\1\0\4\65\7\0\2\65\7\0\1\64\1\0\2\64\4\0"+ "\12\65\22\0\2\65\1\0\10\64\1\0\3\64\1\0\27\64\1\0"+ "\20\64\4\0\6\65\2\0\3\65\1\0\4\65\11\0\1\65\10\0"+ "\2\64\4\0\12\65\221\0\56\64\1\0\1\64\1\65\2\64\7\65"+ "\5\0\6\64\1\65\10\65\1\0\12\65\47\0\2\64\1\0\1\64"+ "\2\0\2\64\1\0\1\64\2\0\1\64\6\0\4\64\1\0\7\64"+ "\1\0\3\64\1\0\1\64\1\0\1\64\2\0\2\64\1\0\2\64"+ "\1\0\1\64\1\65\2\64\6\65\1\0\2\65\1\64\2\0\5\64"+ "\1\0\1\65\1\0\6\65\2\0\12\65\76\0\2\65\6\0\12\65"+ "\13\0\1\65\1\0\1\65\1\0\1\65\4\0\2\65\10\64\1\0"+ "\41\64\7\0\24\65\1\0\6\65\4\0\6\65\1\0\1\65\1\0"+ "\25\65\3\0\7\65\1\0\1\65\346\0\46\64\12\0\47\64\11\0"+ "\1\64\1\0\2\64\1\0\3\64\1\0\1\64\1\0\2\64\1\0"+ "\5\64\51\0\1\64\1\0\1\64\1\0\1\64\13\0\1\64\1\0"+ "\1\64\1\0\1\64\3\0\2\64\3\0\1\64\5\0\3\64\1\0"+ "\1\64\1\0\1\64\1\0\1\64\1\0\1\64\3\0\2\64\3\0"+ "\2\64\1\0\1\64\50\0\1\64\11\0\1\64\2\0\1\64\2\0"+ "\2\64\7\0\2\64\1\0\1\64\1\0\7\64\50\0\1\64\4\0"+ "\1\64\10\0\1\64\u0c06\0\234\64\4\0\132\64\6\0\26\64\2\0"+ "\6\64\2\0\46\64\2\0\6\64\2\0\10\64\1\0\1\64\1\0"+ "\1\64\1\0\1\64\1\0\37\64\2\0\65\64\1\0\7\64\1\0"+ "\1\64\3\0\3\64\1\0\7\64\3\0\4\64\2\0\6\64\4\0"+ "\15\64\5\0\3\64\1\0\7\64\323\0\15\65\4\0\1\65\104\0"+ "\1\64\3\0\2\64\2\0\1\64\121\0\3\64\u0e82\0\1\65\1\0"+ "\1\64\31\0\11\64\6\65\1\0\5\65\13\0\124\64\4\0\2\65"+ "\2\0\2\65\2\0\132\64\1\0\3\65\6\0\50\64\u1cd3\0\u51a6\64"+ "\u0c5a\0\u2ba4\64\134\0\u0800\0\u1ffe\0\2\0"; /** * Translates characters to character classes */ final private static char [] yycmap = yy_unpack_cmap(yycmap_packed); /** * Translates a state to a row index in the transition table */ final private static int yy_rowMap [] = { 0, 55, 110, 165, 220, 275, 330, 385, 440, 495, 550, 605, 660, 715, 770, 825, 880, 935, 990, 1045, 1100, 1155, 1210, 1265, 1320, 1375, 1430, 1485, 1540, 1595, 1650, 1705, 1760, 1705, 1760, 1815, 1705, 1705, 1760, 1870, 1925, 1980, 2035, 2090, 2145, 2200, 1705, 1760, 2255, 2310, 2365, 1705, 2420, 2420, 2475, 2530, 2585, 2255, 2640, 2695, 1705, 2750, 2805, 2860, 2915, 1705, 2970, 3025, 3080, 3135, 3190, 1705, 3245, 3300, 3355, 3410, 3465, 3520, 3575, 3630, 3630, 3685, 3740, 3795, 3850, 3850, 3905, 3960, 4015, 4070, 4070, 4125, 4180, 4235, 4290, 1705, 4345, 4345, 4400, 4455, 4510, 4565, 1705, 1705, 1760, 1705, 1705, 4620, 4675, 4730, 4785, 4840, 4895, 4950, 5005, 5060, 1705, 5115, 5170, 1705, 1705, 2420, 5225, 2530, 1705, 5280, 2585, 1705, 2970, 5335, 3080, 1705, 5390, 3135, 4620, 5445, 5500, 5555, 3410, 1705, 5610, 5665, 3630, 3685, 3630, 5720, 3740, 1705, 5775, 5830, 5885, 5885, 5940, 5995, 3850, 3905, 3850, 6050, 3960, 1705, 6105, 4015, 4070, 6160, 4125, 1705, 6215, 6270, 6325, 6325, 6380, 6435, 6490, 4345, 6545, 4400, 1705, 6600, 6655, 6710, 6710, 6765, 6820, 6875, 6930, 6985, 7040, 7095, 1705, 7150, 7205, 1705, 1705, 1705, 2035, 7260, 7315, 7370, 7425, 7480, 7535, 5775, 7590, 7590, 6215, 7645, 7645, 7700, 6600, 7755, 7755, 7810, 1705, 7865, 7920, 7975, 1705, 8030, 8085, 8140, 8195, 8250, 8305, 8360, 5940, 6380, 8415, 6765, 8470, 8525, 8580, 1705, 8635, 8690, 8745, 8800, 8855, 8910, 8965, 9020, 9075, 9130, 9185, 9240, 9295, 1705, 1705, 9350, 9405, 9460, 9515, 1705, 1705, 1705, 9570, 9625, 9680, 9735, 9790, 9845, 1705, 9900, 4235, 4510, 9955, 10010, 10065, 10120, 2035 }; /** * The packed transition table of the DFA */ final private static String yy_packed = "\1\34\1\35\14\34\1\36\4\34\1\37\43\34\1\40"+ "\1\41\65\40\1\42\1\43\10\42\1\44\12\42\1\45"+ "\41\42\1\46\1\47\65\46\1\42\1\43\5\42\1\50"+ "\15\42\1\45\42\42\1\43\2\42\1\51\1\52\2\42"+ "\1\53\3\42\1\53\3\42\1\52\4\42\1\52\1\54"+ "\1\55\16\53\1\42\12\53\1\42\3\53\1\42\1\53"+ "\1\42\1\43\2\42\1\51\1\56\12\42\1\56\4\42"+ "\1\56\41\42\1\57\1\60\2\57\1\61\20\57\1\45"+ "\41\57\1\42\1\43\2\42\1\62\1\52\2\42\1\63"+ "\3\42\1\63\3\42\1\52\4\42\1\52\20\63\1\42"+ "\12\63\1\42\3\63\1\42\1\63\1\42\1\43\2\42"+ "\1\62\1\52\2\42\1\63\3\42\1\63\3\42\1\52"+ "\4\42\1\52\20\63\1\64\12\63\1\42\3\63\1\42"+ "\1\63\1\65\1\43\1\42\1\66\1\67\1\52\7\65"+ "\1\70\1\65\1\71\1\52\4\65\1\52\41\65\1\42"+ "\1\43\2\42\1\72\20\42\1\45\41\42\1\73\1\74"+ "\1\75\1\76\4\73\1\77\3\73\1\77\11\73\20\100"+ "\1\73\12\100\1\73\3\100\1\73\1\100\1\42\1\74"+ "\1\75\1\76\1\42\1\52\2\42\5\101\3\42\1\52"+ "\4\42\1\52\20\101\1\42\12\101\1\42\3\101\1\42"+ "\1\101\1\42\1\74\1\75\1\76\1\42\1\52\2\42"+ "\5\101\3\42\1\52\4\42\1\52\20\101\1\102\12\101"+ "\1\42\3\101\1\42\1\101\1\103\1\74\1\75\1\104"+ "\1\103\1\52\7\103\1\105\1\103\1\106\1\52\4\103"+ "\1\52\41\103\1\42\1\107\1\110\2\42\1\52\12\42"+ "\1\52\4\42\1\52\7\42\1\111\1\112\2\42\1\113"+ "\7\42\1\113\1\42\1\112\1\111\13\42\1\43\1\110"+ "\2\42\1\52\3\42\1\114\6\42\1\52\4\42\1\52"+ "\42\42\1\43\1\110\2\42\1\52\2\42\1\115\1\114"+ "\2\42\1\115\3\42\1\52\4\42\1\52\20\115\1\42"+ "\12\115\1\42\3\115\1\42\1\115\1\42\1\43\1\110"+ "\2\42\1\52\3\42\1\114\6\42\1\52\4\42\1\52"+ "\14\42\1\116\5\42\1\117\5\42\1\116\10\42\1\120"+ "\1\43\1\110\1\121\1\120\1\52\3\120\1\122\3\120"+ "\1\123\1\120\1\124\1\52\4\120\1\52\41\120\1\125"+ "\1\43\1\110\1\126\1\125\1\52\3\125\1\127\3\125"+ "\1\130\1\125\1\131\1\52\4\125\1\52\41\125\1\132"+ "\1\43\1\110\1\133\1\132\1\52\7\132\1\134\1\132"+ "\1\135\1\52\4\132\1\52\41\132\1\136\1\137\1\140"+ "\64\136\1\141\1\43\1\110\1\142\1\141\1\52\7\141"+ "\1\143\1\141\1\144\1\52\4\141\1\52\41\141\1\145"+ "\1\146\1\147\64\145\1\150\1\151\65\150\1\34\1\0"+ "\14\34\1\0\4\34\1\0\43\34\3\0\1\152\1\153"+ "\17\0\1\154\47\0\1\155\2\0\1\156\3\0\1\157"+ "\3\0\1\155\4\0\1\155\20\156\1\0\12\156\1\0"+ "\3\156\1\0\1\156\5\0\1\155\2\0\1\160\3\0"+ "\1\160\3\0\1\155\2\0\1\161\1\0\1\155\20\160"+ "\1\0\12\160\1\0\3\160\1\0\1\160\113\0\1\162"+ "\54\0\1\163\63\0\1\164\61\0\1\165\71\0\1\52"+ "\12\0\1\52\4\0\1\52\47\0\7\53\4\0\1\53"+ "\4\0\20\53\1\0\12\53\1\0\5\53\6\0\7\53"+ "\4\0\1\53\4\0\2\53\2\166\14\53\1\0\12\53"+ "\1\0\5\53\6\0\7\53\4\0\1\53\4\0\2\53"+ "\1\166\1\167\14\53\1\0\12\53\1\0\5\53\5\0"+ "\1\56\12\0\1\56\4\0\1\56\43\0\1\170\66\0"+ "\1\171\72\0\7\63\4\0\1\63\4\0\20\63\1\0"+ "\12\63\1\0\5\63\1\65\2\0\1\172\1\65\1\0"+ "\7\65\1\0\1\65\2\0\4\65\1\0\42\65\1\0"+ "\1\171\1\172\1\65\1\0\7\65\1\0\1\65\2\0"+ "\4\65\1\0\41\65\1\70\2\173\1\174\1\70\1\173"+ "\7\70\1\175\1\70\2\173\4\70\1\173\41\70\1\71"+ "\2\176\1\177\1\71\1\176\7\71\1\176\1\71\1\175"+ "\1\176\4\71\1\176\41\71\1\73\3\0\22\73\20\0"+ "\1\73\12\0\1\73\3\0\1\73\4\0\1\152\20\0"+ "\1\154\44\0\1\200\64\0\1\73\3\0\2\73\7\77"+ "\4\73\1\77\4\73\20\100\1\73\12\100\1\73\3\100"+ "\1\77\1\100\6\0\7\100\4\0\1\100\4\0\20\100"+ "\1\0\12\100\1\0\5\100\6\0\7\101\4\0\1\101"+ "\4\0\20\101\1\0\12\101\1\0\5\101\1\103\2\0"+ "\1\201\1\103\1\0\7\103\1\0\1\103\2\0\4\103"+ "\1\0\42\103\1\0\1\200\1\201\1\103\1\0\7\103"+ "\1\0\1\103\2\0\4\103\1\0\41\103\1\105\2\202"+ "\1\203\1\105\1\202\7\105\1\204\1\105\2\202\4\105"+ "\1\202\41\105\1\106\2\205\1\206\1\106\1\205\7\106"+ "\1\205\1\106\1\204\1\205\4\106\1\205\41\106\3\0"+ "\1\152\20\0\1\207\106\0\1\210\61\0\1\211\12\0"+ "\1\211\46\0\2\212\33\0\12\213\1\214\54\213\6\0"+ "\7\115\4\0\1\115\4\0\20\115\1\0\12\115\1\0"+ "\5\115\47\0\1\215\5\0\1\215\71\0\1\216\6\0"+ "\1\120\2\0\1\217\1\120\1\0\7\120\1\0\1\120"+ "\2\0\4\120\1\0\41\120\1\122\2\213\1\220\1\122"+ "\1\213\4\122\1\221\2\122\1\213\1\122\2\213\4\122"+ "\1\213\41\122\1\123\2\222\1\223\1\123\1\222\7\123"+ "\1\224\1\123\2\222\4\123\1\222\41\123\1\225\2\226"+ "\1\227\1\230\1\226\3\230\2\225\2\230\1\226\1\225"+ "\1\231\1\232\4\230\1\232\36\230\2\225\1\230\1\125"+ "\2\0\1\233\1\125\1\0\7\125\1\0\1\125\2\0"+ "\4\125\1\0\41\125\1\127\2\213\1\234\1\127\1\213"+ "\4\127\1\235\2\127\1\213\1\127\2\213\4\127\1\213"+ "\41\127\1\130\2\236\1\237\1\130\1\236\7\130\1\240"+ "\1\130\2\236\4\130\1\236\41\130\1\131\2\241\1\242"+ "\1\131\1\241\7\131\1\241\1\131\1\240\1\241\4\131"+ "\1\241\41\131\1\132\2\0\1\243\1\132\1\0\7\132"+ "\1\0\1\132\2\0\4\132\1\0\41\132\1\134\2\244"+ "\1\245\1\134\1\244\7\134\1\246\1\134\2\244\4\134"+ "\1\244\41\134\1\247\2\250\1\251\1\252\1\250\3\252"+ "\2\247\2\252\1\250\1\247\1\253\1\254\4\252\1\254"+ "\36\252\2\247\1\252\2\136\1\0\66\136\1\0\21\136"+ "\1\255\42\136\1\141\2\0\1\256\1\141\1\0\7\141"+ "\1\0\1\141\2\0\4\141\1\0\41\141\1\143\2\257"+ "\1\260\1\143\1\257\7\143\1\261\1\143\2\257\4\143"+ "\1\257\41\143\1\262\2\263\1\264\1\265\1\263\3\265"+ "\2\262\2\265\1\263\1\262\1\266\1\267\4\265\1\267"+ "\36\265\2\262\1\265\2\145\1\0\66\145\1\0\21\145"+ "\1\270\42\145\7\0\1\271\1\0\1\272\62\0\1\155"+ "\2\0\1\34\3\0\1\34\3\0\1\155\4\0\1\155"+ "\20\34\1\0\12\34\1\0\3\34\1\0\1\34\1\273"+ "\1\0\3\273\1\274\7\156\1\273\1\0\1\273\1\274"+ "\1\156\1\273\1\0\1\273\1\274\20\156\1\273\12\156"+ "\1\275\5\156\1\273\1\0\3\273\1\274\7\156\1\273"+ "\1\0\1\273\1\274\1\276\1\273\1\0\1\273\1\274"+ "\1\156\1\277\16\156\1\273\12\156\1\275\5\156\1\273"+ "\1\0\3\273\1\274\7\160\1\273\1\0\1\273\1\274"+ "\1\160\1\273\1\0\1\273\1\274\20\160\1\273\12\160"+ "\1\300\5\160\23\0\1\161\54\0\1\272\57\0\1\301"+ "\66\0\1\302\72\0\7\53\4\0\1\53\4\0\4\53"+ "\2\303\12\53\1\0\12\53\1\0\5\53\6\0\7\53"+ "\4\0\1\53\4\0\4\53\1\303\1\304\12\53\1\0"+ "\12\53\1\0\5\53\15\173\1\175\51\173\17\176\1\175"+ "\47\176\15\202\1\204\51\202\17\205\1\204\47\205\34\0"+ "\1\305\26\0\1\305\42\0\1\306\12\0\1\306\55\0"+ "\1\307\7\0\1\307\57\0\1\310\13\0\1\310\72\0"+ "\1\311\4\0\15\222\1\224\51\222\1\225\2\226\1\312"+ "\1\225\1\226\7\225\1\226\1\225\1\224\1\226\4\225"+ "\1\226\41\225\17\226\1\224\47\226\1\225\2\226\1\312"+ "\1\225\1\226\7\225\1\226\1\225\1\313\1\226\4\225"+ "\1\226\41\225\17\0\1\314\47\0\17\226\1\313\47\226"+ "\15\236\1\240\51\236\17\241\1\240\47\241\15\244\1\246"+ "\51\244\1\247\2\250\1\315\1\247\1\250\7\247\1\250"+ "\1\247\1\246\1\250\4\247\1\250\41\247\17\250\1\246"+ "\47\250\1\247\2\250\1\315\1\247\1\250\7\247\1\250"+ "\1\247\1\316\1\250\4\247\1\250\41\247\17\0\1\317"+ "\47\0\17\250\1\316\47\250\2\136\1\0\6\136\1\320"+ "\55\136\15\257\1\261\51\257\1\262\2\263\1\321\1\262"+ "\1\263\7\262\1\263\1\262\1\261\1\263\4\262\1\263"+ "\41\262\17\263\1\261\47\263\1\262\2\263\1\321\1\262"+ "\1\263\7\262\1\263\1\262\1\322\1\263\4\262\1\263"+ "\41\262\17\0\1\323\47\0\17\263\1\322\47\263\2\145"+ "\1\0\6\145\1\324\55\145\7\0\1\325\113\0\1\326"+ "\32\0\1\273\1\0\14\273\1\0\4\273\1\0\35\273"+ "\1\0\6\273\1\0\3\273\1\274\2\273\1\327\3\273"+ "\1\327\1\273\1\0\1\273\1\274\2\273\1\0\1\273"+ "\1\274\20\327\1\273\12\327\1\330\3\327\1\273\1\327"+ "\1\273\1\0\3\273\1\274\7\156\1\273\1\0\1\273"+ "\1\274\1\276\1\273\1\0\1\273\1\274\20\156\1\273"+ "\12\156\1\331\5\156\1\273\1\0\3\273\1\274\7\156"+ "\1\273\1\0\1\273\1\274\1\332\1\273\1\0\1\273"+ "\1\274\6\156\3\332\2\156\1\332\4\156\1\273\2\156"+ "\1\332\1\156\2\332\2\156\1\332\1\156\1\275\2\332"+ "\3\156\6\0\1\53\1\333\5\53\4\0\1\53\4\0"+ "\20\53\1\0\12\53\1\0\5\53\37\0\1\334\12\0"+ "\1\334\46\0\2\335\63\0\2\336\74\0\1\337\12\0"+ "\1\337\46\0\2\340\36\0\2\341\1\0\3\341\2\0"+ "\2\341\2\0\1\231\44\341\2\0\1\341\3\0\2\342"+ "\1\0\3\342\2\0\2\342\2\0\1\253\44\342\2\0"+ "\1\342\2\136\1\0\31\136\1\343\32\136\3\0\2\344"+ "\1\0\3\344\2\0\2\344\2\0\1\266\44\344\2\0"+ "\1\344\2\145\1\0\31\145\1\345\32\145\35\0\1\346"+ "\31\0\1\273\1\0\3\273\1\347\7\327\1\273\1\0"+ "\1\273\1\347\1\327\1\273\1\0\1\273\1\347\20\327"+ "\1\273\12\327\1\350\5\327\61\0\1\330\5\0\1\273"+ "\1\0\3\273\1\274\7\156\1\273\1\0\1\273\1\274"+ "\1\332\1\273\1\0\1\273\1\274\6\156\3\332\2\156"+ "\1\332\4\156\1\273\2\156\1\332\1\156\2\332\2\156"+ "\1\332\1\156\1\331\2\332\3\156\6\0\7\53\4\0"+ "\1\53\4\0\14\53\1\351\3\53\1\0\12\53\1\0"+ "\5\53\47\0\1\352\5\0\1\352\54\0\1\353\64\0"+ "\1\354\7\0\1\354\56\0\1\355\7\0\1\355\60\0"+ "\1\356\23\0\2\136\1\0\32\136\1\357\31\136\2\145"+ "\1\0\32\145\1\360\31\145\36\0\1\361\30\0\1\273"+ "\1\0\3\273\1\347\2\273\1\327\3\273\1\327\1\273"+ "\1\0\1\273\1\347\2\273\1\0\1\273\1\347\20\327"+ "\1\273\12\327\1\0\3\327\1\273\1\327\6\0\7\53"+ "\4\0\1\53\4\0\20\53\1\0\3\53\1\362\6\53"+ "\1\0\5\53\50\0\1\363\60\0\1\364\13\0\1\364"+ "\55\0\1\365\51\0\2\366\71\0\1\367\26\0\1\367"+ "\3\0\2\136\1\0\33\136\1\370\30\136\2\145\1\0"+ "\33\145\1\371\30\145\37\0\1\372\35\0\7\53\4\0"+ "\1\53\4\0\20\53\1\0\6\53\1\373\3\53\1\0"+ "\5\53\41\0\1\374\7\0\1\374\54\0\1\375\12\0"+ "\1\375\53\0\1\376\12\0\1\376\14\0\2\136\1\0"+ "\34\136\1\377\27\136\2\145\1\0\34\145\1\u0100\27\145"+ "\36\0\1\u0101\36\0\7\53\4\0\1\53\4\0\5\53"+ "\1\u0102\12\53\1\0\12\53\1\0\5\53\2\136\1\0"+ "\33\136\1\u0103\30\136\2\145\1\0\33\145\1\u0104\30\145"+ "\11\0\1\u0105\63\0\7\53\4\0\1\53\4\0\13\53"+ "\1\u0106\4\53\1\0\12\53\1\0\5\53\2\136\1\0"+ "\6\136\1\u0107\55\136\2\145\1\0\6\145\1\u0108\55\145"+ "\6\0\7\53\4\0\1\53\4\0\14\53\1\u0109\3\53"+ "\1\0\12\53\1\0\5\53\6\0\7\53\4\0\1\53"+ "\4\0\20\53\1\0\12\53\1\0\4\53\1\u010a\6\0"+ "\7\53\4\0\1\53\4\0\13\53\1\u010b\4\53\1\0"+ "\12\53\1\0\5\53\6\0\7\53\4\0\1\53\4\0"+ "\13\53\1\u010c\4\53\1\0\12\53\1\0\5\53\6\0"+ "\7\53\4\0\1\53\4\0\20\53\1\0\3\53\1\u010d"+ "\6\53\1\0\5\53"; /** * The transition table of the DFA */ final private static int yytrans [] = yy_unpack(yy_packed); /* error codes */ final private static int YY_UNKNOWN_ERROR = 0; // final private static int YY_ILLEGAL_STATE = 1; final private static int YY_NO_MATCH = 2; final private static int YY_PUSHBACK_2BIG = 3; /* error messages for the codes above */ final private static String YY_ERROR_MSG[] = { "Unkown internal scanner error", //$NON-NLS-1$ "Internal error: unknown state", //$NON-NLS-1$ "Error: could not match input", //$NON-NLS-1$ "Error: pushback value was too large" //$NON-NLS-1$ }; /** * YY_ATTRIBUTE[aState] contains the attributes of state <code>aState</code> */ private final static byte YY_ATTRIBUTE[] = { 1, 0, 0, 0, 0, 1, 0, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 0, 1, 1, 1, 1, 9, 1, 9, 1, 1, 9, 9, 1, 1, 1, 1, 1, 1, 1, 1, 9, 1, 1, 1, 1, 9, 1, 1, 1, 1, 1, 1, 1, 1, 9, 1, 1, 1, 1, 9, 1, 1, 1, 1, 1, 9, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 1, 9, 1, 1, 1, 1, 1, 1, 9, 9, 1, 9, 9, 1, 0, 1, 1, 1, 1, 0, 0, 0, 9, 1, 1, 9, 9, 0, 0, 0, 9, 0, 0, 9, 0, 0, 0, 9, 0, 0, 0, 0, 0, 0, 0, 9, 0, 0, 0, 0, 1, 0, 0, 9, 1, 0, 0, 1, 1, 0, 0, 0, 1, 0, 0, 9, 0, 0, 0, 0, 0, 9, 1, 0, 0, 1, 1, 0, 1, 0, 0, 0, 9, 1, 0, 0, 1, 1, 0, 1, 0, 0, 1, 1, 9, 1, 1, 9, 9, 9, 1, 1, 0, 0, 0, 0, 0, 0, 1, 0, 0, 1, 0, 1, 0, 1, 0, 1, 9, 0, 1, 1, 9, 1, 1, 0, 0, 0, 0, 0, 0, 0, 1, 0, 1, 0, 1, 9, 1, 0, 0, 0, 0, 0, 1, 1, 0, 1, 0, 0, 0, 9, 9, 1, 1, 0, 1, 9, 9, 9, 1, 1, 0, 1, 1, 1, 9, 1, 1, 1, 1, 1, 1, 1, 1 }; /** the input device */ private java.io.Reader yy_reader; /** the current state of the DFA */ private int yy_state; /** the current lexical state */ private int yy_lexical_state = YYINITIAL; /** this buffer contains the current text to be matched and is the source of the yytext() string */ private char yy_buffer[] = new char[16384]; /** the textposition at the last accepting state */ private int yy_markedPos; /** the current text position in the buffer */ private int yy_currentPos; /** startRead marks the beginning of the yytext() string in the buffer */ private int yy_startRead; /** endRead marks the last character in the buffer, that has been read from input */ private int yy_endRead; /** number of newlines encountered up to the start of the matched text */ // private int yyline; /** the number of characters up to the start of the matched text */ private int yychar; /** * the number of characters from the last newline up to the start of the * matched text */ // private int yycolumn; /** * yy_atBOL == true <=> the scanner is currently at the beginning of a line */ // private boolean yy_atBOL; /** yy_atEOF == true <=> the scanner has returned a value for EOF */ private boolean yy_atEOF; /** denotes if the user-EOF-code has already been executed */ private boolean yy_eof_done; /* user code: */ private int fTokenCount = 0; // required holders for white-space compacting private boolean fShouldLoadBuffered = false; private String fBufferedContext = null; private int fBufferedStart = 1; private int fBufferedLength = 0; private String f_context = null; // state stack for handling embedded regions private IntStack fStateStack = new IntStack(); private String context = null; private int start = 0; private int textLength = 0; private int length = 0; // offset for tracking position specific block tags private int fOffset = 0; // the name of the current tag being opened private String fCurrentTagName = null; // the list of tag name BlockMarkers private List fBlockMarkers = new ArrayList(); // required to not seek text blocks on an end tag private boolean fIsBlockingEnabled = false; private boolean fIsCaseSensitiveBlocking = true; private XMLParserRegionFactory fRegionFactory = new XMLParserRegionFactory(); /** * user method */ public final void addBlockMarker(BlockMarker marker) { if(containsTagName(marker.getTagName())) return; fBlockMarkers.add(marker); } /** * user method */ public final void removeBlockMarker(BlockMarker marker) { fBlockMarkers.remove(marker); } /** * user method */ public final void removeBlockMarker(String tagname) { if (fBlockMarkers != null) { Iterator blocks = fBlockMarkers.iterator(); while (blocks.hasNext()) { if (((BlockMarker) blocks.next()).getTagName().equals(tagname)) blocks.remove(); } } } /* user method */ public final boolean isCaseSensitiveBlocking() { return fIsCaseSensitiveBlocking; } /* user method */ public final void setCaseSensitiveBlocking(boolean newValue) { fIsCaseSensitiveBlocking = newValue; } /* user method */ public boolean getBlockMarkerCaseSensitivity() { return getBlockMarkerCaseSensitivity(fCurrentTagName); } /* user method */ public boolean getBlockMarkerCaseSensitivity(String name) { Iterator iterator = fBlockMarkers.iterator(); while(iterator.hasNext()) { BlockMarker marker = (BlockMarker)iterator.next(); boolean casesensitive = marker.isCaseSensitive(); if(casesensitive && marker.getTagName().equals(name)) return casesensitive; else if(!casesensitive && marker.getTagName().equalsIgnoreCase(name)) return casesensitive; } return true; } /* user method */ public String getBlockMarkerContext() { return getBlockMarkerContext(fCurrentTagName); } /* user method */ public String getBlockMarkerContext(String name) { Iterator iterator = fBlockMarkers.iterator(); while(iterator.hasNext()) { BlockMarker marker = (BlockMarker)iterator.next(); if(marker.getTagName().equals(name)) return marker.getContext(); } return BLOCK_TEXT; } /* user method */ public List getBlockMarkers() { return fBlockMarkers; } /* user method */ public final int getOffset() { return fOffset + yychar; } private final boolean isBlockMarker() { return isBlockMarker(fCurrentTagName); } private final boolean isBlockMarker(String tagName) { if (!fIsBlockingEnabled) return false; return containsTagName(tagName); } /** * user method */ public final void beginBlockTagScan(String newTagName) { beginBlockMarkerScan(newTagName, BLOCK_TEXT); } /** * user method * * Special tokenizer setup. Allows tokenization to be initiated at the * start of a text block within a "newTagName" tag. * * Example: * Tokenizer toker = new Tokenizer(); * toker.setCaseSensitiveBlocking(false); * toker.reset(new java.io.StringReader("afiuhqwkejhtasihgalkwhtq</scripter></scr></script>asgdasga")); * toker.beginBlockMarkerScan("script", BLOCK_TEXT); * toker.getRegions(); * * Returns: * BLOCK_TEXT: 0-40 * XML_END_TAG_OPEN: 41-42 * XML_TAG_NAME: 43-48 * XML_TAG_CLOSE: 49-49 * XML_CONTENT: 50-57 * */ public final void beginBlockMarkerScan(String newTagName, String blockcontext) { yybegin(ST_BLOCK_TAG_SCAN); fCurrentTagName = newTagName; } /** * Method doScan. * * Returns a context region for all of the text from the current position upto the end of input or * to right *before* the first occurence of searchString * * @param searchString - target string to search for ex.: "-->", "</tagname" * @param requireTailSeparator - whether the target must be immediately followed by whitespace or '>' * @param context - the context of the scanned region if non-zero length * @param exitState - the state to go to if the region was of non-zero length * @param abortState - the state to go to if the searchString was found immediately * @return String - the context found: the desired context on a non-zero length match, the abortContext on immediate success * @throws IOException */ private final String doScan(String searchString, boolean requireTailSeparator, String searchContext, int exitState, int immediateFallbackState) throws IOException { boolean stillSearching = true; // Disable further block (probably) fIsBlockingEnabled = false; int searchStringLength = searchString.length(); int n = 0; char lastCheckChar; int i; boolean same = false; while (stillSearching) { n = 0; // Ensure that enough data from the input exists to compare against the search String. n = yy_advance(); while(n != YYEOF && yy_currentPos < searchStringLength) n = yy_advance(); // If the input was too short or we've exhausted the input, stop immediately. if (n == YYEOF) { stillSearching = false; } else { same = true; // Ensure that we've not encountered a complete block (<%%>) that was *shorter* than the closeTagString and // thus found twice at current-targetLength [since the first scan would have come out this far anyway]. // Check the characters in the target versus the last targetLength characters read from the buffer // and see if it matches // safety check for array accesses (yy_currentPos is the *last* character we can check against) if(yy_currentPos >= searchStringLength && yy_currentPos <= yy_buffer.length) { for(i = 0; i < searchStringLength; i++) { if(same && fIsCaseSensitiveBlocking) same = yy_buffer[i + yy_currentPos - searchStringLength] == searchString.charAt(i); else if(same && !fIsCaseSensitiveBlocking) same = Character.toLowerCase(yy_buffer[i + yy_currentPos - searchStringLength]) == Character.toLowerCase(searchString.charAt(i)); } } // safety check failed; no match is possible right now else { same = false; } if (same && requireTailSeparator && yy_currentPos < yy_buffer.length) { // Additional check for close tags to ensure that targetString="</script" doesn't match // "</scriptS" lastCheckChar = yy_buffer[yy_currentPos]; // Succeed on "</script>" and "</script " if(lastCheckChar == '>' || Character.isWhitespace(lastCheckChar)) stillSearching = false; } else { stillSearching = !same || (yy_currentPos < yy_startRead + searchStringLength); } } } if (n != YYEOF || same) { // We've stopped short of the end or definitely found a match yy_markedPos = yy_currentPos - searchStringLength; yy_currentPos = yy_markedPos + 1; // If the searchString occurs at the very beginning of what would have // been a Block, resume scanning normally immediately if (yy_markedPos == yy_startRead) { yybegin(immediateFallbackState); return primGetNextToken(); } } else { // We ran through the rest of the input yy_markedPos = yy_currentPos; yy_currentPos++; } yybegin(exitState); // If the ending occurs at the very beginning of what would have // been a Block, resume scanning normally immediately if(yy_markedPos == yy_startRead) return primGetNextToken(); return searchContext; } /** * user method * * A generic lookahead-like operation */ private final String doBlockScan(String target, String targetContext, int immediateFallbackState) throws IOException { return doScan(target, false, targetContext, immediateFallbackState, immediateFallbackState); } /** * user method * does a lookahead for the current tag name */ private final String doBlockTagScan() throws IOException { fIsCaseSensitiveBlocking = getBlockMarkerCaseSensitivity(); return doScan("</" + fCurrentTagName, true, getBlockMarkerContext(fCurrentTagName), YYINITIAL, YYINITIAL); } /** * user method * * Converts the raw context String returned by the primGetNextToken() * method into a full ITextRegion by pulling in values for the * current offset within the scanning text. * * Returns null when EOF is encountered and attaches intermittently * discovered whitespace onto the end of useful regions. * * Note that this algorithm caches the token following the one being returned * so that whitespace can be collapsed. */ public final ITextRegion getNextToken() throws IOException { // load the starting non-whitespace token (assume that it is so) if (fShouldLoadBuffered) { context = fBufferedContext; start = fBufferedStart; textLength = length = fBufferedLength; fShouldLoadBuffered = false; } else { context = primGetNextToken(); if (context == XML_TAG_NAME) { if(containsTagName(yy_buffer, yy_startRead, yy_markedPos-yy_startRead)) fCurrentTagName = yytext(); else fCurrentTagName = null; } else if (context == XML_TAG_OPEN) { fIsBlockingEnabled = true; } else if (context == XML_END_TAG_OPEN) { fIsBlockingEnabled = false; } start = yychar; textLength = length = yylength(); if (yy_atEOF) { fTokenCount++; return null; } } // store the next token f_context = primGetNextToken(); if (f_context == XML_TAG_NAME) { if(containsTagName(yy_buffer, yy_startRead, yy_markedPos-yy_startRead)) fCurrentTagName = yytext(); else fCurrentTagName = null; } else if (f_context == XML_TAG_OPEN) { fIsBlockingEnabled = true; } else if (f_context == XML_END_TAG_OPEN) { fIsBlockingEnabled = false; } fBufferedContext = f_context; fBufferedStart = yychar; fBufferedLength = yylength(); fShouldLoadBuffered = true; if (fBufferedContext == WHITE_SPACE) { fShouldLoadBuffered = false; length += fBufferedLength; } if (context == null) { // EOF if (Debug.debugTokenizer) { System.out.println(getClass().getName() + " discovered " + fTokenCount + " tokens."); //$NON-NLS-2$//$NON-NLS-1$ } return null; } fTokenCount++; return fRegionFactory.createToken(context, start, textLength, length, null, fCurrentTagName); } /* user method */ public HTMLTokenizer(){ super(); } /* user method */ public HTMLTokenizer(char[] charArray){ this(new CharArrayReader(charArray)); } /* user method */ public void reset(char[] charArray) { reset(new CharArrayReader(charArray), 0); } /* user method */ public void reset(char[] charArray, int newOffset) { reset(new CharArrayReader(charArray), newOffset); } /* user method */ public void reset(java.io.InputStream in) { reset(new java.io.InputStreamReader(in), 0); } /* user method */ public void reset(java.io.InputStream in, int newOffset) { reset(new java.io.InputStreamReader(in), newOffset); } /* user method */ public void reset(java.io.Reader in) { reset(in, 0); } /** * user method * * * Reset internal counters and vars to "newly created" values, in the hopes * that resetting a pre-existing tokenizer is faster than creating a new one. * * This method contains code blocks that were essentially duplicated from the * <em>generated</em> output of this specification before this method was * added. Those code blocks were under the above copyright. */ public void reset(java.io.Reader in, int newOffset) { if (Debug.debugTokenizer) { System.out.println("resetting tokenizer");//$NON-NLS-1$ } fOffset = newOffset; /* the input device */ yy_reader = in; /* the current state of the DFA */ yy_state = 0; /* the current lexical state */ yy_lexical_state = YYINITIAL; /* this buffer contains the current text to be matched and is the source of the yytext() string */ java.util.Arrays.fill(yy_buffer, (char)0); /* the textposition at the last accepting state */ yy_markedPos = 0; /* the current text position in the buffer */ yy_currentPos = 0; /* startRead marks the beginning of the yytext() string in the buffer */ yy_startRead = 0; /** * endRead marks the last character in the buffer, that has been read * from input */ yy_endRead = 0; /* number of newlines encountered up to the start of the matched text */ //yyline = 0; /* the number of characters up to the start of the matched text */ yychar = 0; /* yy_atEOF == true <=> the scanner has returned a value for EOF */ yy_atEOF = false; /* denotes if the user-EOF-code has already been executed */ yy_eof_done = false; /* user vars: */ fTokenCount = 0; fShouldLoadBuffered = false; fBufferedContext = null; fBufferedStart = 1; fBufferedLength = 0; fStateStack = new IntStack(); context = null; start = 0; textLength = 0; length = 0; } /** * user method * */ public BlockTokenizer newInstance() { HTMLTokenizer newInstance = new HTMLTokenizer(); // global tagmarkers can be shared; they have no state and // are never destroyed (e.g. 'release') for(int i = 0; i < fBlockMarkers.size(); i++) { BlockMarker blockMarker = (BlockMarker) fBlockMarkers.get(i); if(blockMarker.isGlobal()) newInstance.addBlockMarker(blockMarker); } return newInstance; } /* user method */ private final String scanXMLCommentText() throws IOException { // Scan for '-->' and return the text up to that point as // XML_COMMENT_TEXT unless the string occurs IMMEDIATELY, in which // case change to the ST_XML_COMMENT_END state and return the next // context as usual. return doScan("-->", false, XML_COMMENT_TEXT, ST_XML_COMMENT_END, ST_XML_COMMENT_END); } /** * Creates a new scanner * There is also a java.io.InputStream version of this constructor. * * @param in the java.io.Reader to read input from. */ public HTMLTokenizer(java.io.Reader in) { this.yy_reader = in; } /** * Creates a new scanner. * There is also java.io.Reader version of this constructor. * * @param in the java.io.Inputstream to read input from. */ public HTMLTokenizer(java.io.InputStream in) { this(new java.io.InputStreamReader(in)); } /** * Unpacks the compressed DFA transition table. * * @param packed the packed transition table * @return the unpacked transition table */ private static int [] yy_unpack(String packed) { int [] trans = new int[10175]; int i = 0; /* index in packed string */ int j = 0; /* index in unpacked array */ while (i < 3126) { int count = packed.charAt(i++); int value = packed.charAt(i++); value--; do trans[j++] = value; while (--count > 0); } return trans; } /** * Unpacks the compressed character translation table. * * @param packed the packed character translation table * @return the unpacked character translation table */ private static char [] yy_unpack_cmap(String packed) { char [] map = new char[0x10000]; int i = 0; /* index in packed string */ int j = 0; /* index in unpacked array */ while (i < 1372) { int count = packed.charAt(i++); char value = packed.charAt(i++); do map[j++] = value; while (--count > 0); } return map; } /** * Gets the next input character. * * @return the next character of the input stream, EOF if the * end of the stream is reached. * @exception IOException if any I/O-Error occurs */ private int yy_advance() throws java.io.IOException { /* standard case */ if (yy_currentPos < yy_endRead) return yy_buffer[yy_currentPos++]; /* if the eof is reached, we don't need to work hard */ if (yy_atEOF) return YYEOF; /* otherwise: need to refill the buffer */ /* first: make room (if you can) */ if (yy_startRead > 0) { System.arraycopy(yy_buffer, yy_startRead, yy_buffer, 0, yy_endRead-yy_startRead); /* translate stored positions */ yy_endRead-= yy_startRead; yy_currentPos-= yy_startRead; yy_markedPos-= yy_startRead; yy_startRead = 0; } /* is the buffer big enough? */ if (yy_currentPos >= yy_buffer.length) { /* if not: blow it up */ char newBuffer[] = new char[yy_currentPos*2]; System.arraycopy(yy_buffer, 0, newBuffer, 0, yy_buffer.length); yy_buffer = newBuffer; } /* finally: fill the buffer with new input */ int numRead = yy_reader.read(yy_buffer, yy_endRead, yy_buffer.length-yy_endRead); if ( numRead == -1 ) return YYEOF; yy_endRead+= numRead; return yy_buffer[yy_currentPos++]; } /** * Closes the input stream. */ final public void yyclose() throws java.io.IOException { yy_atEOF = true; /* indicate end of file */ yy_endRead = yy_startRead; /* invalidate buffer */ yy_reader.close(); } /** * Returns the current lexical state. */ final public int yystate() { return yy_lexical_state; } /** * Enters a new lexical state * * @param newState the new lexical state */ final public void yybegin(int newState) { yy_lexical_state = newState; } /** * Returns the text matched by the current regular expression. */ final public String yytext() { return new String( yy_buffer, yy_startRead, yy_markedPos-yy_startRead ); } /** * Returns the length of the matched text region. */ final public int yylength() { return yy_markedPos-yy_startRead; } /** * Reports an error that occured while scanning - from the SED JFlex skeleton * * @param errorCode the code of the errormessage to display */ private void yy_ScanError(int errorCode) { try { Logger.log(Logger.ERROR, YY_ERROR_MSG[errorCode]); } catch (ArrayIndexOutOfBoundsException e) { Logger.log(Logger.ERROR, YY_ERROR_MSG[YY_UNKNOWN_ERROR]); } // DO NOT EXIT the VM on an error // System.exit(1); } /** * Pushes the specified amount of characters back into the input stream. * * They will be read again by then next call of the scanning method * * @param number the number of characters to be read again. * This number must not be greater than yylength()! */ void yypushback(int number) { if ( number > yylength() ) yy_ScanError(YY_PUSHBACK_2BIG); yy_markedPos -= number; } /** * user method - skeleton.sed */ protected final boolean containsTagName(char[] markerTagName, int offset, int tagnameLength) { for(int j = 0; j < fBlockMarkers.size(); j++) { BlockMarker marker = (BlockMarker)fBlockMarkers.get(j); if(marker.getTagName().length() == tagnameLength) { boolean matchesSoFar = true; for(int i = 0; i < tagnameLength && matchesSoFar; i++) { if(marker.isCaseSensitive()) { if(marker.getTagName().charAt(i) != markerTagName[i + offset]) matchesSoFar = false; } else { if(Character.toLowerCase(marker.getTagName().charAt(i)) != Character.toLowerCase(markerTagName[i + offset])) matchesSoFar = false; } } if(matchesSoFar) return true; } } return false; } /** * user method - skeleton.sed * * Return ALL of the regions scannable within the remaining text * Note: for verification use */ public final List getRegions() { List tokens = new ArrayList(); ITextRegion region = null; try { region = getNextToken(); while(region != null) { if (region != null) { tokens.add(region); } region = getNextToken(); } } catch (StackOverflowError e) { Logger.logException(getClass().getName()+": input could not be tokenized correctly at position " + getOffset(), e);//$NON-NLS-1$ throw e; } catch (Exception e) { // Since this is convenience method and NOT the recommended // way of getting tokens, many errors are simply hidden Logger.logException("Exception not handled retrieving regions: " + e.getLocalizedMessage(), e);//$NON-NLS-1$ } return tokens; } /** * user method - skeleton.sed */ private final void dump(String s) { if (Debug.debugTokenizer) { System.out.println(s + " (" + yychar + "-" + //$NON-NLS-2$//$NON-NLS-1$ (yylength() + yychar) + "):\'" +//$NON-NLS-1$ StringUtils.escape(yytext()) + "\'");//$NON-NLS-1$ } } /* user method - skeleton.sed */ public final boolean isEOF() { return yy_atEOF; } /* user method - skeleton.sed */ protected final boolean containsTagName(String markerTagName) { Iterator blocks = fBlockMarkers.iterator(); while(blocks.hasNext()) { BlockMarker marker = (BlockMarker)blocks.next(); if(marker.isCaseSensitive()) { if(marker.getTagName().equals(markerTagName)) return true; } else { if(marker.getTagName().equalsIgnoreCase(markerTagName)) return true; } } return false; } /** * Contains user EOF-code, which will be executed exactly once, * when the end of file is reached */ private void yy_do_eof() { if (!yy_eof_done) { yy_eof_done = true; // do nothing, this is the downstream parser's job } } /** * Resumes scanning until the next regular expression is matched, * the end of input is encountered or an I/O-Error occurs. * * @return the next token * @exception IOException if any I/O-Error occurs */ public String primGetNextToken() throws java.io.IOException { int yy_input; int yy_action; while (true) { yychar+= yylength(); yy_action = -1; yy_currentPos = yy_startRead = yy_markedPos; yy_state = yy_lexical_state; yy_forAction: { while (true) { yy_input = yy_advance(); if ( yy_input == YYEOF ) break yy_forAction; int yy_next = yytrans[ yy_rowMap[yy_state] + yycmap[yy_input] ]; if (yy_next == -1) break yy_forAction; yy_state = yy_next; int yy_attributes = YY_ATTRIBUTE[yy_state]; if ( (yy_attributes & 1) > 0 ) { yy_action = yy_state; yy_markedPos = yy_currentPos; if ( (yy_attributes & 8) > 0 ) break yy_forAction; } } } switch (yy_action) { case 268: { if(Debug.debugTokenizer) dump("XSL processing instruction target");//$NON-NLS-1$ yybegin(ST_XML_PI_ATTRIBUTE_NAME); return XML_TAG_NAME; } case 270: break; case 260: case 262: case 263: { if(Debug.debugTokenizer) dump("\nCDATA start");//$NON-NLS-1$ fStateStack.push(yystate()); yybegin(ST_CDATA_TEXT); return XML_CDATA_OPEN; } case 271: break; case 253: { if(Debug.debugTokenizer) dump("element");//$NON-NLS-1$ yybegin(ST_XML_ELEMENT_DECLARATION); return XML_ELEMENT_DECLARATION; } case 272: break; case 252: { if(Debug.debugTokenizer) dump("attlist");//$NON-NLS-1$ yybegin(ST_XML_ATTLIST_DECLARATION); return XML_ATTLIST_DECLARATION; } case 273: break; case 251: { if(Debug.debugTokenizer) dump("doctype");//$NON-NLS-1$ yybegin(ST_XML_DOCTYPE_DECLARATION); return XML_DOCTYPE_DECLARATION; } case 274: break; case 246: { if(Debug.debugTokenizer) dump("doctype external id");//$NON-NLS-1$ yybegin(ST_XML_DOCTYPE_ID_PUBLIC); return XML_DOCTYPE_EXTERNAL_ID_PUBLIC; } case 275: break; case 245: { if(Debug.debugTokenizer) dump("doctype external id");//$NON-NLS-1$ yybegin(ST_XML_DOCTYPE_ID_SYSTEM); return XML_DOCTYPE_EXTERNAL_ID_SYSTEM; } case 276: break; case 216: { if(Debug.debugTokenizer) dump("\nCharRef");//$NON-NLS-1$ return XML_CHAR_REFERENCE; } case 277: break; case 212: { if(Debug.debugTokenizer) dump("\ncomment start");//$NON-NLS-1$ yybegin(ST_XML_COMMENT); return XML_COMMENT_OPEN; } case 278: break; case 194: case 195: { if(Debug.debugTokenizer) dump("XML processing instruction target");//$NON-NLS-1$ yybegin(ST_XML_PI_ATTRIBUTE_NAME); return XML_TAG_NAME; } case 279: break; case 193: { if(Debug.debugTokenizer) dump("comment end");//$NON-NLS-1$ yybegin(YYINITIAL); return XML_COMMENT_CLOSE; } case 280: break; case 192: { if(Debug.debugTokenizer) dump("CDATA end");//$NON-NLS-1$ yybegin(fStateStack.pop()); return XML_CDATA_CLOSE; } case 281: break; case 191: { if(Debug.debugTokenizer) dump("\nPEReference");//$NON-NLS-1$ return XML_PE_REFERENCE; } case 282: break; case 188: { if(Debug.debugTokenizer) dump("\nEntityRef");//$NON-NLS-1$ return XML_ENTITY_REFERENCE; } case 283: break; case 139: case 144: case 156: { return XML_DOCTYPE_INTERNAL_SUBSET; } case 284: break; case 127: { yybegin(YYINITIAL); if(Debug.debugTokenizer) dump("empty tag close");//$NON-NLS-1$ return XML_EMPTY_TAG_CLOSE; } case 285: break; case 120: { if(Debug.debugTokenizer) dump("XML processing instruction end");//$NON-NLS-1$ yybegin(YYINITIAL); return XML_PI_CLOSE; } case 286: break; case 119: { // ended with nothing inside yybegin(YYINITIAL); return XML_PI_CLOSE; } case 287: break; case 52: case 54: case 55: case 56: case 124: { if(Debug.debugTokenizer) dump("XML processing instruction attribute value");//$NON-NLS-1$ yybegin(ST_XML_PI_ATTRIBUTE_NAME); return XML_TAG_ATTRIBUTE_VALUE; } case 288: break; case 51: { if(Debug.debugTokenizer) dump("XML processing instruction '='");//$NON-NLS-1$ yybegin(ST_XML_PI_ATTRIBUTE_VALUE); return XML_TAG_ATTRIBUTE_EQUALS; } case 289: break; case 50: { if(Debug.debugTokenizer) dump("XML processing instruction attribute name");//$NON-NLS-1$ yybegin(ST_XML_PI_EQUALS); return XML_TAG_ATTRIBUTE_NAME; } case 290: break; case 46: case 47: case 48: { // block scan until close is found return doScan("?>", false, XML_PI_CONTENT, ST_XML_PI_TAG_CLOSE, ST_XML_PI_TAG_CLOSE); } case 291: break; case 45: { yybegin(ST_PI_CONTENT); return WHITE_SPACE; } case 292: break; case 42: case 43: case 44: case 117: case 118: case 218: case 232: case 241: case 250: case 257: case 261: case 264: case 265: case 266: case 267: { if(Debug.debugTokenizer) dump("processing instruction target");//$NON-NLS-1$ yybegin(ST_PI_WS); return XML_TAG_NAME; } case 293: break; case 37: case 38: { if(Debug.debugTokenizer) dump("comment content");//$NON-NLS-1$ return scanXMLCommentText(); } case 294: break; case 36: { if(Debug.debugTokenizer) dump("LINE FEED");//$NON-NLS-1$ return WHITE_SPACE; } case 295: break; case 31: case 32: { if(Debug.debugTokenizer) dump("CDATA text");//$NON-NLS-1$ String blockContext = doBlockScan("]]>", XML_CDATA_TEXT, ST_CDATA_END);//$NON-NLS-1$ if(blockContext == XML_CDATA_TEXT) yybegin(ST_CDATA_END); return blockContext; } case 296: break; case 0: case 27: case 109: case 110: case 111: case 186: case 187: case 189: case 190: case 214: case 215: case 217: case 230: case 231: { if(Debug.debugTokenizer) dump("\nXML content");//$NON-NLS-1$ return XML_CONTENT; } case 297: break; case 5: case 8: case 9: case 10: case 13: case 14: case 15: case 16: case 17: case 18: case 19: case 20: case 21: case 22: case 24: case 41: { if(Debug.debugTokenizer) dump("white space");//$NON-NLS-1$ return WHITE_SPACE; } case 298: break; case 12: case 58: { if(Debug.debugTokenizer) dump("inappropriate tag name");//$NON-NLS-1$ yybegin(YYINITIAL); return XML_CONTENT; } case 299: break; case 23: case 93: case 94: case 172: case 207: case 226: case 238: case 247: case 254: case 258: { if(Debug.debugTokenizer) dump("elementdecl contentspec");//$NON-NLS-1$ return XML_ELEMENT_DECL_CONTENT; } case 300: break; case 25: case 100: case 101: case 183: case 211: case 228: case 239: case 248: case 255: case 259: { if(Debug.debugTokenizer) dump("attlist contentspec");//$NON-NLS-1$ return XML_ATTLIST_DECL_CONTENT; } case 301: break; case 28: case 59: case 70: { if(Debug.debugTokenizer) dump("\nstart tag open");//$NON-NLS-1$ yybegin(ST_XML_TAG_NAME); return XML_TAG_OPEN; } case 302: break; case 29: case 33: case 34: case 35: case 39: case 40: case 49: case 53: case 57: case 61: case 67: case 72: case 73: case 74: case 75: case 77: case 78: case 80: case 85: case 90: case 97: { if (Debug.debugTokenizer) System.out.println("!!!unexpected!!!: \"" + yytext() + "\":" + //$NON-NLS-2$//$NON-NLS-1$ yychar + "-" + (yychar + yylength()));//$NON-NLS-1$ return UNDEFINED; } case 303: break; case 30: case 112: { if(Debug.debugTokenizer) dump("non-reference %");//$NON-NLS-1$ return XML_CONTENT; } case 304: break; case 60: { if(Debug.debugTokenizer) dump("tag close");//$NON-NLS-1$ if(isBlockMarker()) { yybegin(ST_BLOCK_TAG_SCAN); } else yybegin(YYINITIAL); return XML_TAG_CLOSE; } case 305: break; case 62: case 63: { if(Debug.debugTokenizer) dump("tag name");//$NON-NLS-1$ yybegin(ST_XML_ATTRIBUTE_NAME); return XML_TAG_NAME; } case 306: break; case 64: { if(Debug.debugTokenizer) dump("attr name");//$NON-NLS-1$ yybegin(ST_XML_EQUALS); return XML_TAG_ATTRIBUTE_NAME; } case 307: break; case 65: { if(Debug.debugTokenizer) dump("equals");//$NON-NLS-1$ yybegin(ST_XML_ATTRIBUTE_VALUE); return XML_TAG_ATTRIBUTE_EQUALS; } case 308: break; case 66: case 68: case 69: case 131: { if(Debug.debugTokenizer) dump("attr value");//$NON-NLS-1$ yybegin(ST_XML_ATTRIBUTE_NAME); return XML_TAG_ATTRIBUTE_VALUE; } case 309: break; case 71: { if(Debug.debugTokenizer) dump("declaration end");//$NON-NLS-1$ if (Debug.debugTokenizer) { if(fStateStack.peek()!=YYINITIAL) System.out.println("end embedded region");//$NON-NLS-1$ } yybegin(fStateStack.pop()); return XML_DECLARATION_CLOSE; } case 310: break; case 76: { if(Debug.debugTokenizer) dump("doctype type");//$NON-NLS-1$ yybegin(ST_XML_DOCTYPE_EXTERNAL_ID); return XML_DOCTYPE_NAME; } case 311: break; case 79: case 81: case 82: case 83: case 147: case 148: case 151: case 152: case 202: { if(Debug.debugTokenizer) dump("doctype public reference");//$NON-NLS-1$ yybegin(ST_XML_DOCTYPE_ID_SYSTEM); return XML_DOCTYPE_EXTERNAL_ID_PUBREF; } case 312: break; case 84: case 86: case 87: case 88: case 159: { if(Debug.debugTokenizer) dump("doctype system reference");//$NON-NLS-1$ yybegin(ST_XML_DECLARATION_CLOSE); return XML_DOCTYPE_EXTERNAL_ID_SYSREF; } case 313: break; case 89: case 91: case 92: case 165: case 166: case 169: case 170: case 205: { if(Debug.debugTokenizer) dump("elementdecl name");//$NON-NLS-1$ yybegin(ST_XML_ELEMENT_DECLARATION_CONTENT); return XML_ELEMENT_DECL_NAME; } case 314: break; case 95: { if(Debug.debugTokenizer) dump("elementdecl close");//$NON-NLS-1$ if (Debug.debugTokenizer) { if(fStateStack.peek()!=YYINITIAL) System.out.println("end embedded region");//$NON-NLS-1$ } yybegin(fStateStack.pop()); return XML_DECLARATION_CLOSE; } case 315: break; case 96: case 98: case 99: case 176: case 177: case 180: case 181: case 209: { if(Debug.debugTokenizer) dump("attlist name");//$NON-NLS-1$ yybegin(ST_XML_ATTLIST_DECLARATION_CONTENT); return XML_ATTLIST_DECL_NAME; } case 316: break; case 102: { if(Debug.debugTokenizer) dump("attlist close");//$NON-NLS-1$ if (Debug.debugTokenizer) { if(fStateStack.peek()!=YYINITIAL) System.out.println("end embedded region");//$NON-NLS-1$ } yybegin(fStateStack.pop()); return XML_DECLARATION_CLOSE; } case 317: break; case 105: { if(Debug.debugTokenizer) dump("\nend tag open");//$NON-NLS-1$ yybegin(ST_XML_TAG_NAME); return XML_END_TAG_OPEN; } case 318: break; case 106: { if(Debug.debugTokenizer) dump("\nprocessing instruction start");//$NON-NLS-1$ yybegin(ST_PI); return XML_PI_OPEN; } case 319: break; case 107: { fStateStack.push(yystate()); if(Debug.debugTokenizer) dump("\ndeclaration start");//$NON-NLS-1$ yybegin(ST_XML_DECLARATION); return XML_DECLARATION_OPEN; } case 320: break; case 116: { if(Debug.debugTokenizer) dump("processing instruction end");//$NON-NLS-1$ yybegin(YYINITIAL); return XML_PI_CLOSE; } case 321: break; case 103: case 104: { return doBlockTagScan(); } case 322: break; default: if (yy_input == YYEOF && yy_startRead == yy_currentPos) { yy_atEOF = true; yy_do_eof(); return null; } else { yy_ScanError(YY_NO_MATCH); } } } } }