package org.apache.lucene.facet.search; import java.io.IOException; import java.util.Iterator; import java.util.List; import org.apache.lucene.analysis.MockAnalyzer; import org.apache.lucene.analysis.MockTokenizer; import org.apache.lucene.facet.FacetTestUtils; import org.apache.lucene.facet.index.params.CategoryListParams; import org.apache.lucene.facet.index.params.FacetIndexingParams; import org.apache.lucene.facet.index.params.PerDimensionIndexingParams; import org.apache.lucene.facet.search.params.CountFacetRequest; import org.apache.lucene.facet.search.params.FacetSearchParams; import org.apache.lucene.facet.search.results.FacetResult; import org.apache.lucene.facet.search.results.FacetResultNode; import org.apache.lucene.facet.taxonomy.CategoryPath; import org.apache.lucene.facet.taxonomy.TaxonomyReader; import org.apache.lucene.facet.taxonomy.TaxonomyWriter; import org.apache.lucene.facet.taxonomy.directory.DirectoryTaxonomyReader; import org.apache.lucene.facet.taxonomy.directory.DirectoryTaxonomyWriter; import org.apache.lucene.index.DocsEnum; import org.apache.lucene.index.IndexReader; import org.apache.lucene.index.IndexWriterConfig.OpenMode; import org.apache.lucene.index.MultiFields; import org.apache.lucene.index.RandomIndexWriter; import org.apache.lucene.index.Term; import org.apache.lucene.search.DocIdSetIterator; import org.apache.lucene.search.IndexSearcher; import org.apache.lucene.search.MatchAllDocsQuery; import org.apache.lucene.search.MultiCollector; import org.apache.lucene.search.Query; import org.apache.lucene.search.TopScoreDocCollector; import org.apache.lucene.store.Directory; import org.apache.lucene.util.BytesRef; import org.apache.lucene.util.IOUtils; import org.apache.lucene.util.LuceneTestCase; import org.apache.lucene.util._TestUtil; import org.junit.Test; /* * Licensed to the Apache Software Foundation (ASF) under one or more * contributor license agreements. See the NOTICE file distributed with * this work for additional information regarding copyright ownership. * The ASF licenses this file to You under the Apache License, Version 2.0 * (the "License"); you may not use this file except in compliance with * the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ public class TestMultipleCategoryLists extends LuceneTestCase { @Test public void testDefault() throws Exception { Directory[][] dirs = getDirs(); // create and open an index writer RandomIndexWriter iw = new RandomIndexWriter(random(), dirs[0][0], newIndexWriterConfig( TEST_VERSION_CURRENT, new MockAnalyzer(random(), MockTokenizer.WHITESPACE, false))); // create and open a taxonomy writer TaxonomyWriter tw = new DirectoryTaxonomyWriter(dirs[0][1], OpenMode.CREATE); /** * Configure with no custom counting lists */ PerDimensionIndexingParams iParams = new PerDimensionIndexingParams(); seedIndex(iw, tw, iParams); IndexReader ir = iw.getReader(); tw.commit(); // prepare index reader and taxonomy. TaxonomyReader tr = new DirectoryTaxonomyReader(dirs[0][1]); // prepare searcher to search against IndexSearcher searcher = newSearcher(ir); FacetsCollector facetsCollector = performSearch(iParams, tr, ir, searcher); // Obtain facets results and hand-test them assertCorrectResults(facetsCollector); DocsEnum td = _TestUtil.docs(random(), ir, "$facets", new BytesRef("$fulltree$"), MultiFields.getLiveDocs(ir), null, 0); assertTrue(td.nextDoc() != DocIdSetIterator.NO_MORE_DOCS); tr.close(); ir.close(); iw.close(); tw.close(); IOUtils.close(dirs[0]); } @Test public void testCustom() throws Exception { Directory[][] dirs = getDirs(); // create and open an index writer RandomIndexWriter iw = new RandomIndexWriter(random(), dirs[0][0], newIndexWriterConfig( TEST_VERSION_CURRENT, new MockAnalyzer(random(), MockTokenizer.WHITESPACE, false))); // create and open a taxonomy writer TaxonomyWriter tw = new DirectoryTaxonomyWriter(dirs[0][1], OpenMode.CREATE); PerDimensionIndexingParams iParams = new PerDimensionIndexingParams(); iParams.addCategoryListParams(new CategoryPath("Author"), new CategoryListParams(new Term("$author", "Authors"))); seedIndex(iw, tw, iParams); IndexReader ir = iw.getReader(); tw.commit(); // prepare index reader and taxonomy. TaxonomyReader tr = new DirectoryTaxonomyReader(dirs[0][1]); // prepare searcher to search against IndexSearcher searcher = newSearcher(ir); FacetsCollector facetsCollector = performSearch(iParams, tr, ir, searcher); // Obtain facets results and hand-test them assertCorrectResults(facetsCollector); assertPostingListExists("$facets", "$fulltree$", ir); assertPostingListExists("$author", "Authors", ir); tr.close(); ir.close(); iw.close(); tw.close(); IOUtils.close(dirs[0]); } @Test public void testTwoCustomsSameField() throws Exception { Directory[][] dirs = getDirs(); // create and open an index writer RandomIndexWriter iw = new RandomIndexWriter(random(), dirs[0][0], newIndexWriterConfig( TEST_VERSION_CURRENT, new MockAnalyzer(random(), MockTokenizer.WHITESPACE, false))); // create and open a taxonomy writer TaxonomyWriter tw = new DirectoryTaxonomyWriter(dirs[0][1], OpenMode.CREATE); PerDimensionIndexingParams iParams = new PerDimensionIndexingParams(); iParams.addCategoryListParams(new CategoryPath("Band"), new CategoryListParams(new Term("$music", "Bands"))); iParams.addCategoryListParams(new CategoryPath("Composer"), new CategoryListParams(new Term("$music", "Composers"))); seedIndex(iw, tw, iParams); IndexReader ir = iw.getReader(); tw.commit(); // prepare index reader and taxonomy. TaxonomyReader tr = new DirectoryTaxonomyReader(dirs[0][1]); // prepare searcher to search against IndexSearcher searcher = newSearcher(ir); FacetsCollector facetsCollector = performSearch(iParams, tr, ir, searcher); // Obtain facets results and hand-test them assertCorrectResults(facetsCollector); assertPostingListExists("$facets", "$fulltree$", ir); assertPostingListExists("$music", "Bands", ir); assertPostingListExists("$music", "Composers", ir); tr.close(); ir.close(); iw.close(); tw.close(); IOUtils.close(dirs[0]); } private void assertPostingListExists(String field, String text, IndexReader ir) throws IOException { DocsEnum de = _TestUtil.docs(random(), ir, field, new BytesRef(text), null, null, 0); assertTrue(de.nextDoc() != DocIdSetIterator.NO_MORE_DOCS); } @Test public void testDifferentFieldsAndText() throws Exception { Directory[][] dirs = getDirs(); // create and open an index writer RandomIndexWriter iw = new RandomIndexWriter(random(), dirs[0][0], newIndexWriterConfig( TEST_VERSION_CURRENT, new MockAnalyzer(random(), MockTokenizer.WHITESPACE, false))); // create and open a taxonomy writer TaxonomyWriter tw = new DirectoryTaxonomyWriter(dirs[0][1], OpenMode.CREATE); PerDimensionIndexingParams iParams = new PerDimensionIndexingParams(); iParams.addCategoryListParams(new CategoryPath("Band"), new CategoryListParams(new Term("$bands", "Bands"))); iParams.addCategoryListParams(new CategoryPath("Composer"), new CategoryListParams(new Term("$composers", "Composers"))); seedIndex(iw, tw, iParams); IndexReader ir = iw.getReader(); tw.commit(); // prepare index reader and taxonomy. TaxonomyReader tr = new DirectoryTaxonomyReader(dirs[0][1]); // prepare searcher to search against IndexSearcher searcher = newSearcher(ir); FacetsCollector facetsCollector = performSearch(iParams, tr, ir, searcher); // Obtain facets results and hand-test them assertCorrectResults(facetsCollector); assertPostingListExists("$facets", "$fulltree$", ir); assertPostingListExists("$bands", "Bands", ir); assertPostingListExists("$composers", "Composers", ir); tr.close(); ir.close(); iw.close(); tw.close(); IOUtils.close(dirs[0]); } @Test public void testSomeSameSomeDifferent() throws Exception { Directory[][] dirs = getDirs(); // create and open an index writer RandomIndexWriter iw = new RandomIndexWriter(random(), dirs[0][0], newIndexWriterConfig( TEST_VERSION_CURRENT, new MockAnalyzer(random(), MockTokenizer.WHITESPACE, false))); // create and open a taxonomy writer TaxonomyWriter tw = new DirectoryTaxonomyWriter(dirs[0][1], OpenMode.CREATE); PerDimensionIndexingParams iParams = new PerDimensionIndexingParams(); iParams.addCategoryListParams(new CategoryPath("Band"), new CategoryListParams(new Term("$music", "music"))); iParams.addCategoryListParams(new CategoryPath("Composer"), new CategoryListParams(new Term("$music", "music"))); iParams.addCategoryListParams(new CategoryPath("Author"), new CategoryListParams(new Term("$literature", "Authors"))); seedIndex(iw, tw, iParams); IndexReader ir = iw.getReader(); tw.commit(); // prepare index reader and taxonomy. TaxonomyReader tr = new DirectoryTaxonomyReader(dirs[0][1]); // prepare searcher to search against IndexSearcher searcher = newSearcher(ir); FacetsCollector facetsCollector = performSearch(iParams, tr, ir, searcher); // Obtain facets results and hand-test them assertCorrectResults(facetsCollector); assertPostingListExists("$music", "music", ir); assertPostingListExists("$literature", "Authors", ir); tr.close(); ir.close(); iw.close(); tw.close(); IOUtils.close(dirs[0]); } private Directory[][] getDirs() { return FacetTestUtils.createIndexTaxonomyDirs(1); } private void assertCorrectResults(FacetsCollector facetsCollector) throws IOException { List<FacetResult> res = facetsCollector.getFacetResults(); FacetResult results = res.get(0); FacetResultNode resNode = results.getFacetResultNode(); Iterable<? extends FacetResultNode> subResults = resNode .getSubResults(); Iterator<? extends FacetResultNode> subIter = subResults.iterator(); checkResult(resNode, "Band", 5.0); checkResult(subIter.next(), "Band/Rock & Pop", 4.0); checkResult(subIter.next(), "Band/Punk", 1.0); results = res.get(1); resNode = results.getFacetResultNode(); subResults = resNode.getSubResults(); subIter = subResults.iterator(); checkResult(resNode, "Band", 5.0); checkResult(subIter.next(), "Band/Rock & Pop", 4.0); checkResult(subIter.next(), "Band/Rock & Pop/Dave Matthews Band", 1.0); checkResult(subIter.next(), "Band/Rock & Pop/REM", 1.0); checkResult(subIter.next(), "Band/Rock & Pop/U2", 1.0); checkResult(subIter.next(), "Band/Punk/The Ramones", 1.0); checkResult(subIter.next(), "Band/Punk", 1.0); checkResult(subIter.next(), "Band/Rock & Pop/The Beatles", 1.0); results = res.get(2); resNode = results.getFacetResultNode(); subResults = resNode.getSubResults(); subIter = subResults.iterator(); checkResult(resNode, "Author", 3.0); checkResult(subIter.next(), "Author/Kurt Vonnegut", 1.0); checkResult(subIter.next(), "Author/Stephen King", 1.0); checkResult(subIter.next(), "Author/Mark Twain", 1.0); results = res.get(3); resNode = results.getFacetResultNode(); subResults = resNode.getSubResults(); subIter = subResults.iterator(); checkResult(resNode, "Band/Rock & Pop", 4.0); checkResult(subIter.next(), "Band/Rock & Pop/Dave Matthews Band", 1.0); checkResult(subIter.next(), "Band/Rock & Pop/REM", 1.0); checkResult(subIter.next(), "Band/Rock & Pop/U2", 1.0); checkResult(subIter.next(), "Band/Rock & Pop/The Beatles", 1.0); } private FacetsCollector performSearch(FacetIndexingParams iParams, TaxonomyReader tr, IndexReader ir, IndexSearcher searcher) throws IOException { // step 1: collect matching documents into a collector Query q = new MatchAllDocsQuery(); TopScoreDocCollector topDocsCollector = TopScoreDocCollector.create(10, true); // Faceted search parameters indicate which facets are we interested in FacetSearchParams facetSearchParams = new FacetSearchParams(iParams); facetSearchParams.addFacetRequest(new CountFacetRequest( new CategoryPath("Band"), 10)); CountFacetRequest bandDepth = new CountFacetRequest(new CategoryPath( "Band"), 10); bandDepth.setDepth(2); facetSearchParams.addFacetRequest(bandDepth); facetSearchParams.addFacetRequest(new CountFacetRequest( new CategoryPath("Author"), 10)); facetSearchParams.addFacetRequest(new CountFacetRequest( new CategoryPath("Band", "Rock & Pop"), 10)); // perform documents search and facets accumulation FacetsCollector facetsCollector = new FacetsCollector(facetSearchParams, ir, tr); searcher.search(q, MultiCollector.wrap(topDocsCollector, facetsCollector)); return facetsCollector; } private void seedIndex(RandomIndexWriter iw, TaxonomyWriter tw, FacetIndexingParams iParams) throws IOException { FacetTestUtils.add(iParams, iw, tw, "Author", "Mark Twain"); FacetTestUtils.add(iParams, iw, tw, "Author", "Stephen King"); FacetTestUtils.add(iParams, iw, tw, "Author", "Kurt Vonnegut"); FacetTestUtils.add(iParams, iw, tw, "Band", "Rock & Pop", "The Beatles"); FacetTestUtils.add(iParams, iw, tw, "Band", "Punk", "The Ramones"); FacetTestUtils.add(iParams, iw, tw, "Band", "Rock & Pop", "U2"); FacetTestUtils.add(iParams, iw, tw, "Band", "Rock & Pop", "REM"); FacetTestUtils.add(iParams, iw, tw, "Band", "Rock & Pop", "Dave Matthews Band"); FacetTestUtils.add(iParams, iw, tw, "Composer", "Bach"); } private static void checkResult(FacetResultNode sub, String label, double value) { assertEquals("Label of subresult " + sub.getLabel() + " was incorrect", label, sub.getLabel().toString()); assertEquals( "Value for " + sub.getLabel() + " subresult was incorrect", value, sub.getValue(), 0.0); } }