package org.apache.lucene; /** * Licensed to the Apache Software Foundation (ASF) under one or more * contributor license agreements. See the NOTICE file distributed with * this work for additional information regarding copyright ownership. * The ASF licenses this file to You under the Apache License, Version 2.0 * (the "License"); you may not use this file except in compliance with * the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ import java.io.IOException; import java.io.PrintWriter; import java.io.StringWriter; import java.util.Random; import org.apache.lucene.store.*; import org.apache.lucene.document.*; import org.apache.lucene.analysis.*; import org.apache.lucene.index.*; import org.apache.lucene.search.*; import org.apache.lucene.queryParser.*; import org.apache.lucene.util.LuceneTestCase; import junit.framework.TestSuite; import junit.textui.TestRunner; public class TestSearchForDuplicates extends LuceneTestCase { /** Main for running test case by itself. */ public static void main(String args[]) { TestRunner.run (new TestSuite(TestSearchForDuplicates.class)); } static final String PRIORITY_FIELD ="priority"; static final String ID_FIELD ="id"; static final String HIGH_PRIORITY ="high"; static final String MED_PRIORITY ="medium"; static final String LOW_PRIORITY ="low"; /** This test compares search results when using and not using compound * files. * * TODO: There is rudimentary search result validation as well, but it is * simply based on asserting the output observed in the old test case, * without really knowing if the output is correct. Someone needs to * validate this output and make any changes to the checkHits method. */ public void testRun() throws Exception { StringWriter sw = new StringWriter(); PrintWriter pw = new PrintWriter(sw, true); Random random = newRandom(); doTest(random, pw, false); pw.close(); sw.close(); String multiFileOutput = sw.getBuffer().toString(); //System.out.println(multiFileOutput); sw = new StringWriter(); pw = new PrintWriter(sw, true); doTest(random, pw, true); pw.close(); sw.close(); String singleFileOutput = sw.getBuffer().toString(); assertEquals(multiFileOutput, singleFileOutput); } private void doTest(Random random, PrintWriter out, boolean useCompoundFiles) throws Exception { Directory directory = newDirectory(random); Analyzer analyzer = new MockAnalyzer(); IndexWriterConfig conf = newIndexWriterConfig(random, TEST_VERSION_CURRENT, analyzer); LogMergePolicy lmp = (LogMergePolicy) conf.getMergePolicy(); lmp.setUseCompoundFile(useCompoundFiles); lmp.setUseCompoundDocStore(useCompoundFiles); IndexWriter writer = new IndexWriter(directory, conf); final int MAX_DOCS = 225; for (int j = 0; j < MAX_DOCS; j++) { Document d = new Document(); d.add(new Field(PRIORITY_FIELD, HIGH_PRIORITY, Field.Store.YES, Field.Index.ANALYZED)); // NOTE: this ID_FIELD produces no tokens since // MockAnalyzer discards numbers d.add(new Field(ID_FIELD, Integer.toString(j), Field.Store.YES, Field.Index.ANALYZED)); writer.addDocument(d); } writer.close(); // try a search without OR Searcher searcher = new IndexSearcher(directory, true); QueryParser parser = new QueryParser(TEST_VERSION_CURRENT, PRIORITY_FIELD, analyzer); Query query = parser.parse(HIGH_PRIORITY); out.println("Query: " + query.toString(PRIORITY_FIELD)); ScoreDoc[] hits = searcher.search(query, null, MAX_DOCS).scoreDocs; printHits(out, hits, searcher); checkHits(hits, MAX_DOCS, searcher); searcher.close(); // try a new search with OR searcher = new IndexSearcher(directory, true); hits = null; parser = new QueryParser(TEST_VERSION_CURRENT, PRIORITY_FIELD, analyzer); query = parser.parse(HIGH_PRIORITY + " OR " + MED_PRIORITY); out.println("Query: " + query.toString(PRIORITY_FIELD)); hits = searcher.search(query, null, MAX_DOCS).scoreDocs; printHits(out, hits, searcher); checkHits(hits, MAX_DOCS, searcher); searcher.close(); directory.close(); } private void printHits(PrintWriter out, ScoreDoc[] hits, Searcher searcher ) throws IOException { out.println(hits.length + " total results\n"); for (int i = 0 ; i < hits.length; i++) { if ( i < 10 || (i > 94 && i < 105) ) { Document d = searcher.doc(hits[i].doc); out.println(i + " " + d.get(ID_FIELD)); } } } private void checkHits(ScoreDoc[] hits, int expectedCount, Searcher searcher) throws IOException { assertEquals("total results", expectedCount, hits.length); for (int i = 0 ; i < hits.length; i++) { if ( i < 10 || (i > 94 && i < 105) ) { Document d = searcher.doc(hits[i].doc); assertEquals("check " + i, String.valueOf(i), d.get(ID_FIELD)); } } } }