/* * Licensed to the Apache Software Foundation (ASF) under one or more * contributor license agreements. See the NOTICE file distributed with * this work for additional information regarding copyright ownership. * The ASF licenses this file to You under the Apache License, Version 2.0 * (the "License"); you may not use this file except in compliance with * the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package org.apache.lucene.index; import java.text.DecimalFormat; import java.text.DecimalFormatSymbols; import java.text.NumberFormat; import java.util.Locale; import org.apache.lucene.analysis.MockAnalyzer; import org.apache.lucene.analysis.MockTokenizer; import org.apache.lucene.document.Document; import org.apache.lucene.document.Field; import org.apache.lucene.index.IndexWriterConfig.OpenMode; import org.apache.lucene.store.Directory; import org.apache.lucene.util.Bits; import org.apache.lucene.util.LuceneTestCase; public class TestPKIndexSplitter extends LuceneTestCase { public void testSplit() throws Exception { NumberFormat format = new DecimalFormat("000000000", DecimalFormatSymbols.getInstance(Locale.ROOT)); Directory dir = newDirectory(); IndexWriter w = new IndexWriter(dir, newIndexWriterConfig(new MockAnalyzer(random(), MockTokenizer.WHITESPACE, false)) .setOpenMode(OpenMode.CREATE).setMergePolicy(NoMergePolicy.INSTANCE)); for (int x = 0; x < 11; x++) { Document doc = createDocument(x, "1", 3, format); w.addDocument(doc); if (x%3==0) w.commit(); } for (int x = 11; x < 20; x++) { Document doc = createDocument(x, "2", 3, format); w.addDocument(doc); if (x%3==0) w.commit(); } w.close(); final Term midTerm = new Term("id", format.format(11)); checkSplitting(dir, midTerm, 11, 9); // delete some documents w = new IndexWriter(dir, newIndexWriterConfig(new MockAnalyzer(random(), MockTokenizer.WHITESPACE, false)) .setOpenMode(OpenMode.APPEND).setMergePolicy(NoMergePolicy.INSTANCE)); w.deleteDocuments(midTerm); w.deleteDocuments(new Term("id", format.format(2))); w.close(); checkSplitting(dir, midTerm, 10, 8); dir.close(); } private void checkSplitting(Directory dir, Term splitTerm, int leftCount, int rightCount) throws Exception { Directory dir1 = newDirectory(); Directory dir2 = newDirectory(); PKIndexSplitter splitter = new PKIndexSplitter(dir, dir1, dir2, splitTerm, newIndexWriterConfig(new MockAnalyzer(random())), newIndexWriterConfig(new MockAnalyzer(random()))); splitter.split(); IndexReader ir1 = DirectoryReader.open(dir1); IndexReader ir2 = DirectoryReader.open(dir2); assertEquals(leftCount, ir1.numDocs()); assertEquals(rightCount, ir2.numDocs()); checkContents(ir1, "1"); checkContents(ir2, "2"); ir1.close(); ir2.close(); dir1.close(); dir2.close(); } private void checkContents(IndexReader ir, String indexname) throws Exception { final Bits liveDocs = MultiFields.getLiveDocs(ir); for (int i = 0; i < ir.maxDoc(); i++) { if (liveDocs == null || liveDocs.get(i)) { assertEquals(indexname, ir.document(i).get("indexname")); } } } private Document createDocument(int n, String indexName, int numFields, NumberFormat format) { StringBuilder sb = new StringBuilder(); Document doc = new Document(); String id = format.format(n); doc.add(newStringField("id", id, Field.Store.YES)); doc.add(newStringField("indexname", indexName, Field.Store.YES)); sb.append("a"); sb.append(n); doc.add(newTextField("field1", sb.toString(), Field.Store.YES)); sb.append(" b"); sb.append(n); for (int i = 1; i < numFields; i++) { doc.add(newTextField("field" + (i + 1), sb.toString(), Field.Store.YES)); } return doc; } }