/* * Copyright 2007 T-Rank AS * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package no.trank.openpipe.solr.analysis; import java.io.IOException; import java.util.ListIterator; import java.util.Set; import org.apache.lucene.analysis.Token; import org.apache.lucene.analysis.TokenStream; import no.trank.openpipe.api.document.AnnotatedField; import no.trank.openpipe.api.document.ResolvedAnnotation; /** * @version $Revision$ */ public class AnnotationTokenStream extends TokenStream { private ResolvedAnnotation[] anns; private ListIterator<ResolvedAnnotation>[] iterators; private String[] types; private int lastEnd = -1; public AnnotationTokenStream(AnnotatedField doc) { this(doc, doc.getAnnotationTypes()); } @SuppressWarnings({"unchecked"}) public AnnotationTokenStream(AnnotatedField doc, Set<String> annotations) { types = annotations.toArray(new String[annotations.size()]); anns = new ResolvedAnnotation[annotations.size()]; iterators = new ListIterator[annotations.size()]; for (int i = 0; i < types.length; i++) { final ListIterator<ResolvedAnnotation> it = doc.iterator(types[i]); iterators[i] = it; anns[i] = nextOrNull(it); } } @Override public Token next() throws IOException { int idx = 0; ResolvedAnnotation ann = anns[idx]; for (int i = 1; i < anns.length; i++) { final ResolvedAnnotation a2 = anns[i]; if (a2 != null && (ann == null || a2.getStartPos() < ann.getStartPos() || a2.getStartPos() == ann.getStartPos() && a2.getEndPos() < ann.getEndPos())) { ann = a2; idx = i; } } if (ann != null) { anns[idx] = nextOrNull(iterators[idx]); final boolean noIncr = lastEnd == ann.getEndPos(); lastEnd = ann.getEndPos(); if (ann instanceof Token) { return (Token) ann; } final Token token = new Token(ann.getValue(), ann.getStartPos(), lastEnd, types[idx]); if (noIncr) { token.setPositionIncrement(0); } return token; } return null; } private static ResolvedAnnotation nextOrNull(ListIterator<ResolvedAnnotation> it) { return it.hasNext() ? it.next() : null; } }