/** * Copyright 2014 National University of Ireland, Galway. * * This file is part of the SIREn project. Project and contact information: * * https://github.com/rdelbru/SIREn * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package org.sindice.siren.search.node; import static org.sindice.siren.analysis.MockSirenToken.node; import static org.sindice.siren.search.AbstractTestSirenScorer.BooleanClauseBuilder.should; import static org.sindice.siren.search.AbstractTestSirenScorer.NodeBooleanQueryBuilder.nbq; import java.io.IOException; import java.util.ArrayList; import org.junit.Test; import org.sindice.siren.analysis.AnyURIAnalyzer; import org.sindice.siren.analysis.TupleAnalyzer; import org.sindice.siren.analysis.AnyURIAnalyzer.URINormalisation; import org.sindice.siren.index.DocsAndNodesIterator; import org.sindice.siren.index.codecs.RandomSirenCodec.PostingsFormatType; import org.sindice.siren.search.AbstractTestSirenScorer; import org.sindice.siren.util.XSDDatatype; public class TestNodeDisjunctionScorer extends AbstractTestSirenScorer { @Override protected void configure() throws IOException { this.setAnalyzer(AnalyzerType.TUPLE); // TODO: remove when TupleAnalyzer is no more used final AnyURIAnalyzer uriAnalyzer = new AnyURIAnalyzer(TEST_VERSION_CURRENT); uriAnalyzer.setUriNormalisation(URINormalisation.FULL); ((TupleAnalyzer) analyzer).registerDatatype(XSDDatatype.XSD_ANY_URI.toCharArray(), uriAnalyzer); this.setPostingsFormat(PostingsFormatType.RANDOM); } @Test public void testNextCandidateNextNode() throws Exception { this.addDocuments( "<http://renaud.delbru.fr/> . ", "<http://sindice.com/test/name> \"Renaud Delbru\" . ", "<http://sindice.com/test/type> <http://sindice.com/test/Person> . ", "<aaa> <bbb> . <http://sindice.com/test/name> \"R. Delbru\" . " ); final NodeScorer scorer = this.getScorer( nbq(should("renaud"), should("delbru")) ); assertTrue(scorer.nextCandidateDocument()); assertEquals(0, scorer.doc()); assertEquals(node(-1), scorer.node()); assertTrue(scorer.nextNode()); assertEquals(node(0,0), scorer.node()); final float d0score00 = scorer.scoreInNode(); final float d0freq00 = scorer.freqInNode(); assertFalse(scorer.nextNode()); assertEquals(DocsAndNodesIterator.NO_MORE_NOD, scorer.node()); assertTrue(scorer.nextCandidateDocument()); assertEquals(1, scorer.doc()); assertEquals(node(-1), scorer.node()); assertTrue(scorer.nextNode()); assertEquals(node(0,1), scorer.node()); final float d1score01 = scorer.scoreInNode(); final float d1freq01 = scorer.freqInNode(); assertEquals(d0freq00, d1freq01, 0); assertFalse(scorer.nextNode()); assertEquals(DocsAndNodesIterator.NO_MORE_NOD, scorer.node()); assertTrue(scorer.nextCandidateDocument()); assertEquals(3, scorer.doc()); assertEquals(node(-1), scorer.node()); assertTrue(scorer.nextNode()); assertEquals(node(1,1), scorer.node()); // only one term is matched in the node final float d3score11 = scorer.scoreInNode(); final float d3freq11 = scorer.freqInNode(); assertTrue(d0freq00 > d3freq11); assertTrue(d1freq01 > d3freq11); assertTrue(d3score11 + " < " + d1score01, d3score11 < d1score01); assertTrue(d3score11 + " < " + d0score00, d3score11 < d0score00); assertFalse(scorer.nextNode()); assertEquals(DocsAndNodesIterator.NO_MORE_NOD, scorer.node()); assertEndOfStream(scorer); } @Test public void testSkipToCandidateNextNode() throws Exception { final ArrayList<String> docs = new ArrayList<String>(); for (int i = 0; i < 16; i++) { docs.add("\"aaa bbb\" \"aaa ccc\" . \"ccc\" \"bbb ccc\" ."); docs.add("\"aaa ccc bbb\" . \"aaa aaa ccc bbb bbb\" . "); } this.addDocuments(docs); final NodeScorer scorer = this.getScorer( nbq(should("aaa"), should("bbb")) ); assertTrue(scorer.nextCandidateDocument()); assertEquals(0, scorer.doc()); assertEquals(node(-1), scorer.node()); assertTrue(scorer.nextNode()); assertEquals(node(0,0), scorer.node()); assertTrue(scorer.skipToCandidate(16)); assertEquals(16, scorer.doc()); assertEquals(node(-1), scorer.node()); assertTrue(scorer.nextNode()); assertEquals(node(0,0), scorer.node()); assertTrue(scorer.nextCandidateDocument()); assertEquals(17, scorer.doc()); assertEquals(node(-1), scorer.node()); assertTrue(scorer.nextNode()); assertEquals(node(0,0), scorer.node()); assertTrue(scorer.skipToCandidate(20)); assertEquals(20, scorer.doc()); assertEquals(node(-1), scorer.node()); assertTrue(scorer.nextNode()); assertEquals(node(0,0), scorer.node()); assertTrue(scorer.nextCandidateDocument()); assertEquals(21, scorer.doc()); assertEquals(node(-1), scorer.node()); assertTrue(scorer.nextNode()); assertEquals(node(0,0), scorer.node()); assertTrue(scorer.skipToCandidate(30)); assertEquals(30, scorer.doc()); assertEquals(node(-1), scorer.node()); assertTrue(scorer.nextNode()); assertEquals(node(0,0), scorer.node()); assertFalse(scorer.skipToCandidate(34)); assertEndOfStream(scorer); } }