/* * Licensed to the Apache Software Foundation (ASF) under one or more * contributor license agreements. See the NOTICE file distributed with * this work for additional information regarding copyright ownership. * The ASF licenses this file to You under the Apache License, Version 2.0 * (the "License"); you may not use this file except in compliance with * the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package org.apache.lucene.codecs.asserting; import java.io.IOException; import java.util.Collection; import java.util.Iterator; import org.apache.lucene.codecs.FieldsConsumer; import org.apache.lucene.codecs.FieldsProducer; import org.apache.lucene.codecs.PostingsFormat; import org.apache.lucene.index.AssertingLeafReader; import org.apache.lucene.index.FieldInfo; import org.apache.lucene.index.Fields; import org.apache.lucene.index.IndexOptions; import org.apache.lucene.index.IndexWriter; import org.apache.lucene.index.PostingsEnum; import org.apache.lucene.index.SegmentReadState; import org.apache.lucene.index.SegmentWriteState; import org.apache.lucene.index.Terms; import org.apache.lucene.index.TermsEnum; import org.apache.lucene.util.Accountable; import org.apache.lucene.util.BytesRef; import org.apache.lucene.util.BytesRefBuilder; import org.apache.lucene.util.TestUtil; /** * Just like the default postings format but with additional asserts. */ public final class AssertingPostingsFormat extends PostingsFormat { private final PostingsFormat in = TestUtil.getDefaultPostingsFormat(); public AssertingPostingsFormat() { super("Asserting"); } @Override public FieldsConsumer fieldsConsumer(SegmentWriteState state) throws IOException { return new AssertingFieldsConsumer(state, in.fieldsConsumer(state)); } @Override public FieldsProducer fieldsProducer(SegmentReadState state) throws IOException { return new AssertingFieldsProducer(in.fieldsProducer(state)); } static class AssertingFieldsProducer extends FieldsProducer { private final FieldsProducer in; AssertingFieldsProducer(FieldsProducer in) { this.in = in; // do a few simple checks on init assert toString() != null; assert ramBytesUsed() >= 0; assert getChildResources() != null; } @Override public void close() throws IOException { in.close(); in.close(); // close again } @Override public Iterator<String> iterator() { Iterator<String> iterator = in.iterator(); assert iterator != null; return iterator; } @Override public Terms terms(String field) throws IOException { Terms terms = in.terms(field); return terms == null ? null : new AssertingLeafReader.AssertingTerms(terms); } @Override public int size() { return in.size(); } @Override public long ramBytesUsed() { long v = in.ramBytesUsed(); assert v >= 0; return v; } @Override public Collection<Accountable> getChildResources() { Collection<Accountable> res = in.getChildResources(); TestUtil.checkReadOnly(res); return res; } @Override public void checkIntegrity() throws IOException { in.checkIntegrity(); } @Override public FieldsProducer getMergeInstance() throws IOException { return new AssertingFieldsProducer(in.getMergeInstance()); } @Override public String toString() { return getClass().getSimpleName() + "(" + in.toString() + ")"; } } static class AssertingFieldsConsumer extends FieldsConsumer { private final FieldsConsumer in; private final SegmentWriteState writeState; AssertingFieldsConsumer(SegmentWriteState writeState, FieldsConsumer in) { this.writeState = writeState; this.in = in; } @Override public void write(Fields fields) throws IOException { in.write(fields); // TODO: more asserts? can we somehow run a // "limited" CheckIndex here??? Or ... can we improve // AssertingFieldsProducer and us it also to wrap the // incoming Fields here? String lastField = null; for(String field : fields) { FieldInfo fieldInfo = writeState.fieldInfos.fieldInfo(field); assert fieldInfo != null; assert lastField == null || lastField.compareTo(field) < 0; lastField = field; Terms terms = fields.terms(field); if (terms == null) { continue; } assert terms != null; TermsEnum termsEnum = terms.iterator(); BytesRefBuilder lastTerm = null; PostingsEnum postingsEnum = null; boolean hasFreqs = fieldInfo.getIndexOptions().compareTo(IndexOptions.DOCS_AND_FREQS) >= 0; boolean hasPositions = fieldInfo.getIndexOptions().compareTo(IndexOptions.DOCS_AND_FREQS_AND_POSITIONS) >= 0; boolean hasOffsets = fieldInfo.getIndexOptions().compareTo(IndexOptions.DOCS_AND_FREQS_AND_POSITIONS_AND_OFFSETS) >= 0; boolean hasPayloads = terms.hasPayloads(); assert hasPositions == terms.hasPositions(); assert hasOffsets == terms.hasOffsets(); while(true) { BytesRef term = termsEnum.next(); if (term == null) { break; } assert lastTerm == null || lastTerm.get().compareTo(term) < 0; if (lastTerm == null) { lastTerm = new BytesRefBuilder(); lastTerm.append(term); } else { lastTerm.copyBytes(term); } int flags = 0; if (hasPositions == false) { if (hasFreqs) { flags = flags | PostingsEnum.FREQS; } postingsEnum = termsEnum.postings(postingsEnum, flags); } else { flags = PostingsEnum.POSITIONS; if (hasPayloads) { flags |= PostingsEnum.PAYLOADS; } if (hasOffsets) { flags = flags | PostingsEnum.OFFSETS; } postingsEnum = termsEnum.postings(postingsEnum, flags); } assert postingsEnum != null : "termsEnum=" + termsEnum + " hasPositions=" + hasPositions; int lastDocID = -1; while(true) { int docID = postingsEnum.nextDoc(); if (docID == PostingsEnum.NO_MORE_DOCS) { break; } assert docID > lastDocID; lastDocID = docID; if (hasFreqs) { int freq = postingsEnum.freq(); assert freq > 0; if (hasPositions) { int lastPos = -1; int lastStartOffset = -1; for(int i=0;i<freq;i++) { int pos = postingsEnum.nextPosition(); assert pos >= lastPos: "pos=" + pos + " vs lastPos=" + lastPos + " i=" + i + " freq=" + freq; assert pos <= IndexWriter.MAX_POSITION: "pos=" + pos + " is > IndexWriter.MAX_POSITION=" + IndexWriter.MAX_POSITION; lastPos = pos; if (hasOffsets) { int startOffset = postingsEnum.startOffset(); int endOffset = postingsEnum.endOffset(); assert endOffset >= startOffset; assert startOffset >= lastStartOffset; lastStartOffset = startOffset; } } } } } } } } @Override public void close() throws IOException { in.close(); in.close(); // close again } } }