package com.antbrains.wordseg.luceneanalyzer; /** * Licensed to the Apache Software Foundation (ASF) under one or more * contributor license agreements. See the NOTICE file distributed with * this work for additional information regarding copyright ownership. * The ASF licenses this file to You under the Apache License, Version 2.0 * (the "License"); you may not use this file except in compliance with * the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ import java.io.Reader; import java.io.IOException; interface StandardTokenizerInterface { /** This character denotes the end of file */ public static final int YYEOF = -1; /** * Copies the matched text into the CharTermAttribute */ void getText(CharTermAttribute t); /** * Returns the current position. */ int yychar(); /** * Resets the scanner to read from a new input stream. Does not close the old reader. * * All internal variables are reset, the old input stream <b>cannot</b> be reused (internal buffer * is discarded and lost). Lexical state is set to <tt>ZZ_INITIAL</tt>. * * @param reader * the new input stream */ void yyreset(Reader reader); /** * Returns the length of the matched text region. */ int yylength(); /** * Resumes scanning until the next regular expression is matched, the end of input is encountered * or an I/O-Error occurs. * * @return the next token, {@link #YYEOF} on end of stream * @exception IOException * if any I/O-Error occurs */ int getNextToken() throws IOException; }