package lia.tools;
/**
* Copyright Manning Publications Co.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific lan
*/
import junit.framework.TestCase;
import org.apache.lucene.store.RAMDirectory;
import org.apache.lucene.index.IndexWriter;
import org.apache.lucene.index.Term;
import org.apache.lucene.search.Query;
import org.apache.lucene.search.BooleanQuery;
import org.apache.lucene.search.BooleanClause;
import org.apache.lucene.search.TermQuery;
import org.apache.lucene.search.IndexSearcher;
import org.apache.lucene.search.TermRangeFilter;
import org.apache.lucene.search.QueryWrapperFilter;
import org.apache.lucene.search.CachingWrapperFilter;
import org.apache.lucene.search.Filter;
import org.apache.lucene.search.TopDocs;
import org.apache.lucene.document.Document;
import org.apache.lucene.document.DateTools;
import org.apache.lucene.document.Field;
import org.apache.lucene.analysis.WhitespaceAnalyzer;
import org.apache.lucene.misc.ChainedFilter;
import java.util.Calendar;
import lia.common.TestUtil;
// From chapter 9
public class ChainedFilterTest extends TestCase {
public static final int MAX = 500;
private RAMDirectory directory;
private IndexSearcher searcher;
private Query query;
private Filter dateFilter;
private Filter bobFilter;
private Filter sueFilter;
public void setUp() throws Exception {
directory = new RAMDirectory();
IndexWriter writer =
new IndexWriter(directory, new WhitespaceAnalyzer(),
IndexWriter.MaxFieldLength.UNLIMITED);
Calendar cal = Calendar.getInstance();
cal.set(2009, 1, 1, 0, 0); // A
for (int i = 0; i < MAX; i++) {
Document doc = new Document();
doc.add(new Field("key", "" + (i + 1),
Field.Store.YES, Field.Index.NOT_ANALYZED));
doc.add(new Field("owner", (i < MAX / 2) ? "bob" : "sue",
Field.Store.YES, Field.Index.NOT_ANALYZED));
doc.add(new Field("date", DateTools.timeToString(cal.getTimeInMillis(), DateTools.Resolution.DAY),
Field.Store.YES, Field.Index.NOT_ANALYZED));
writer.addDocument(doc);
cal.add(Calendar.DATE, 1);
}
writer.close();
searcher = new IndexSearcher(directory);
BooleanQuery bq = new BooleanQuery(); // B
bq.add(new TermQuery(new Term("owner", "bob")), // B
BooleanClause.Occur.SHOULD); // B
bq.add(new TermQuery(new Term("owner", "sue")), // B
BooleanClause.Occur.SHOULD); // B
query = bq;
cal.set(2099, 1, 1, 0, 0);
dateFilter = TermRangeFilter.Less("date", // C
DateTools.timeToString( // C
cal.getTimeInMillis(), // C
DateTools.Resolution.DAY));// C
bobFilter = new CachingWrapperFilter( // D
new QueryWrapperFilter( // D
new TermQuery(new Term("owner", "bob")))); // D
sueFilter = new CachingWrapperFilter( // E
new QueryWrapperFilter( // E
new TermQuery(new Term("owner", "sue")))); // E
}
/*
#A 2009 January 01
#B BooleanQuery that matches all documents
#C Date filter also matches all documents
#D Matches only Bob's documents
#E Matches only Sue's documents
*/
public void testSingleFilter() throws Exception {
ChainedFilter chain = new ChainedFilter(
new Filter[] {dateFilter});
TopDocs hits = searcher.search(query, chain, 10);
assertEquals(MAX, hits.totalHits);
chain = new ChainedFilter(new Filter[] {bobFilter});
assertEquals(MAX / 2, TestUtil.hitCount(searcher, query, chain), hits.totalHits);
}
public void testOR() throws Exception {
ChainedFilter chain = new ChainedFilter(
new Filter[] {sueFilter, bobFilter});
assertEquals("OR matches all", MAX, TestUtil.hitCount(searcher, query, chain));
}
public void testAND() throws Exception {
ChainedFilter chain = new ChainedFilter(
new Filter[] {dateFilter, bobFilter}, ChainedFilter.AND);
TopDocs hits = searcher.search(query, chain, 10);
assertEquals("AND matches just Bob", MAX / 2, hits.totalHits);
Document firstDoc = searcher.doc(hits.scoreDocs[0].doc);
assertEquals("bob", firstDoc.get("owner"));
}
public void testXOR() throws Exception {
ChainedFilter chain = new ChainedFilter(
new Filter[]{dateFilter, bobFilter}, ChainedFilter.XOR);
TopDocs hits = searcher.search(query, chain, 10);
assertEquals("XOR matches Sue", MAX / 2, hits.totalHits);
Document firstDoc = searcher.doc(hits.scoreDocs[0].doc);
assertEquals("sue", firstDoc.get("owner"));
}
public void testANDNOT() throws Exception {
ChainedFilter chain = new ChainedFilter(
new Filter[]{dateFilter, sueFilter},
new int[] {ChainedFilter.AND, ChainedFilter.ANDNOT});
TopDocs hits = searcher.search(query, chain, 10);
assertEquals("ANDNOT matches just Bob",
MAX / 2, hits.totalHits);
Document firstDoc = searcher.doc(hits.scoreDocs[0].doc);
assertEquals("bob", firstDoc.get("owner"));
}
}