/* * Licensed to the Apache Software Foundation (ASF) under one or more * contributor license agreements. See the NOTICE file distributed with * this work for additional information regarding copyright ownership. * The ASF licenses this file to You under the Apache License, Version 2.0 * (the "License"); you may not use this file except in compliance with * the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package org.apache.lucene.analysis.charfilter; import org.apache.lucene.analysis.CharFilter; import org.apache.lucene.util.ArrayUtil; import java.io.Reader; import java.util.Arrays; /** * Base utility class for implementing a {@link CharFilter}. * You subclass this, and then record mappings by calling * {@link #addOffCorrectMap}, and then invoke the correct * method to correct an offset. */ public abstract class BaseCharFilter extends CharFilter { private int offsets[]; private int diffs[]; private int size = 0; public BaseCharFilter(Reader in) { super(in); } /** Retrieve the corrected offset. */ @Override protected int correct(int currentOff) { if (offsets == null) { return currentOff; } int index = Arrays.binarySearch(offsets, 0, size, currentOff); if (index < -1) { index = -2 - index; } final int diff = index < 0 ? 0 : diffs[index]; return currentOff + diff; } protected int getLastCumulativeDiff() { return offsets == null ? 0 : diffs[size-1]; } /** * <p> * Adds an offset correction mapping at the given output stream offset. * </p> * <p> * Assumption: the offset given with each successive call to this method * will not be smaller than the offset given at the previous invocation. * </p> * * @param off The output stream offset at which to apply the correction * @param cumulativeDiff The input offset is given by adding this * to the output offset */ protected void addOffCorrectMap(int off, int cumulativeDiff) { if (offsets == null) { offsets = new int[64]; diffs = new int[64]; } else if (size == offsets.length) { offsets = ArrayUtil.grow(offsets); diffs = ArrayUtil.grow(diffs); } assert (size == 0 || off >= offsets[size - 1]) : "Offset #" + size + "(" + off + ") is less than the last recorded offset " + offsets[size - 1] + "\n" + Arrays.toString(offsets) + "\n" + Arrays.toString(diffs); if (size == 0 || off != offsets[size - 1]) { offsets[size] = off; diffs[size++] = cumulativeDiff; } else { // Overwrite the diff at the last recorded offset diffs[size - 1] = cumulativeDiff; } } }