/**
 * Copyright 2014 National University of Ireland, Galway.
 *
 * This file is part of the SIREn project. Project and contact information:
 *
 *  https://github.com/rdelbru/SIREn
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.sindice.siren.search.node;

import static org.sindice.siren.analysis.MockSirenToken.node;
import static org.sindice.siren.search.AbstractTestSirenScorer.NodeTermQueryBuilder.ntq;

import java.io.IOException;
import java.util.ArrayList;

import org.junit.Test;
import org.sindice.siren.analysis.AnyURIAnalyzer;
import org.sindice.siren.analysis.TupleAnalyzer;
import org.sindice.siren.analysis.AnyURIAnalyzer.URINormalisation;
import org.sindice.siren.index.DocsAndNodesIterator;
import org.sindice.siren.index.codecs.RandomSirenCodec.PostingsFormatType;
import org.sindice.siren.search.AbstractTestSirenScorer;
import org.sindice.siren.util.XSDDatatype;

/**
 * Tests for the scorer obtained from a node term query: document, node and
 * position iteration, level and interval constraints, skipping, and scoring.
 */
public class TestNodeTermScorer extends AbstractTestSirenScorer {

  /**
   * Selects the tuple analyzer, registers a URI analyzer with full
   * normalisation for the {@code xsd:anyURI} datatype, and picks the random
   * postings format.
   */
  @Override
  protected void configure() throws IOException {
    this.setAnalyzer(AnalyzerType.TUPLE);

    // TODO: remove when TupleAnalyzer is no more used
    final AnyURIAnalyzer anyUri = new AnyURIAnalyzer(TEST_VERSION_CURRENT);
    anyUri.setUriNormalisation(URINormalisation.FULL);
    final TupleAnalyzer tuples = (TupleAnalyzer) analyzer;
    tuples.registerDatatype(XSDDatatype.XSD_ANY_URI.toCharArray(), anyUri);

    this.setPostingsFormat(PostingsFormatType.RANDOM);
  }

  /**
   * Builds the fixture shared by the skipping tests: the given documents,
   * in the given order, repeated 32 times.
   */
  private ArrayList<String> repeatedDocuments(final String... cycle) {
    final int rounds = 32;
    final ArrayList<String> result = new ArrayList<String>();
    for (int round = 0; round < rounds; round++) {
      for (final String document : cycle) {
        result.add(document);
      }
    }
    return result;
  }

  /**
   * Skips the scorer to candidate 17 and checks that it reports document 18
   * with the node cursor still at its initial {@code node(-1)} value.
   */
  private void assertSkipFrom17LandsOn18(final NodeScorer target) throws Exception {
    assertTrue(target.skipToCandidate(17));
    assertEquals(18, target.doc());
    assertEquals(node(-1), target.node());
  }

  /** Asking for a position on a freshly created scorer must fail. */
  @Test
  public void testNextPositionFail() throws Exception {
    this.addDocument("<http://renaud.delbru.fr/> . ");

    final NodeTermScorer termScorer = (NodeTermScorer) this.getScorer(ntq("renaud"));
    assertFalse(termScorer.nextPosition());
  }

  /** Asking for a node on a freshly created scorer must fail. */
  @Test
  public void testNextNodeFail() throws Exception {
    this.addDocument("<http://renaud.delbru.fr/> . ");

    final NodeScorer nodeScorer = this.getScorer(ntq("renaud"));
    assertFalse(nodeScorer.nextNode());
  }

  /**
   * With a level constraint, the document is always a candidate, but a node is
   * only returned for level 2; levels 1 and 3 yield no node.
   */
  @Test
  public void testLevelConstraint() throws Exception {
    this.addDocument("<http://renaud.delbru.fr/> . ");

    final NodeScorer levelOne = this.getScorer(ntq("renaud").level(1));
    assertTrue(levelOne.nextCandidateDocument());
    assertEquals(0, levelOne.doc());
    assertFalse(levelOne.nextNode());

    final NodeScorer levelThree = this.getScorer(ntq("renaud").level(3));
    assertTrue(levelThree.nextCandidateDocument());
    assertEquals(0, levelThree.doc());
    assertFalse(levelThree.nextNode());

    final NodeScorer levelTwo = this.getScorer(ntq("renaud").level(2));
    assertTrue(levelTwo.nextCandidateDocument());
    assertEquals(0, levelTwo.doc());
    assertTrue(levelTwo.nextNode());
    assertEquals(node(0,0), levelTwo.node());
  }

  /**
   * With an interval constraint, the document is always a candidate, but a
   * node is only returned for the bound (0,0); (1,1) and (1,2) yield no node.
   */
  @Test
  public void testIntervalConstraint() throws Exception {
    this.addDocument("<http://renaud.delbru.fr/> . ");

    final NodeScorer oneToOne = this.getScorer(ntq("renaud").bound(1,1));
    assertTrue(oneToOne.nextCandidateDocument());
    assertEquals(0, oneToOne.doc());
    assertFalse(oneToOne.nextNode());

    final NodeScorer oneToTwo = this.getScorer(ntq("renaud").bound(1,2));
    assertTrue(oneToTwo.nextCandidateDocument());
    assertEquals(0, oneToTwo.doc());
    assertFalse(oneToTwo.nextNode());

    final NodeScorer zeroToZero = this.getScorer(ntq("renaud").bound(0,0));
    assertTrue(zeroToZero.nextCandidateDocument());
    assertEquals(0, zeroToZero.doc());
    assertTrue(zeroToZero.nextNode());
    assertEquals(node(0,0), zeroToZero.node());
  }

  /**
   * Walks document, node and position cursors over two single-document
   * indexes: one with two URI nodes, one with a URI node and a literal node.
   */
  @Test
  public void testNextPositionWithURI() throws Exception {
    // First index: the term occurs in the nodes (0,0) and (0,1).
    this.addDocument("<http://renaud.delbru.fr/> <http://renaud.delbru.fr/> . ");

    final NodeTermScorer uriOnly = (NodeTermScorer) this.getScorer(ntq("renaud"));
    assertTrue(uriOnly.nextCandidateDocument());
    assertEquals(0, uriOnly.doc());
    assertEquals(node(-1), uriOnly.node());
    assertEquals(-1, uriOnly.pos());

    assertTrue(uriOnly.nextNode());
    assertEquals(node(0,0), uriOnly.node());
    assertEquals(-1, uriOnly.pos());
    assertTrue(uriOnly.nextPosition());
    assertEquals(0, uriOnly.pos());

    assertTrue(uriOnly.nextNode());
    assertEquals(node(0,1), uriOnly.node());
    assertEquals(-1, uriOnly.pos());
    assertTrue(uriOnly.nextPosition());
    assertEquals(0, uriOnly.pos());

    assertEndOfStream(uriOnly);

    // Second index: the term occurs in the nodes (0,0) and (0,2).
    this.deleteAll();
    this.addDocument("<http://renaud.delbru.fr/> <http://test/name> \"Renaud Delbru\" . ");

    final NodeTermScorer uriAndLiteral = (NodeTermScorer) this.getScorer(ntq("renaud"));
    assertTrue(uriAndLiteral.nextCandidateDocument());
    assertEquals(0, uriAndLiteral.doc());
    assertEquals(node(-1), uriAndLiteral.node());
    assertEquals(-1, uriAndLiteral.pos());

    assertTrue(uriAndLiteral.nextNode());
    assertEquals(node(0,0), uriAndLiteral.node());
    assertEquals(-1, uriAndLiteral.pos());
    assertTrue(uriAndLiteral.nextPosition());
    assertEquals(0, uriAndLiteral.pos());

    assertTrue(uriAndLiteral.nextNode());
    assertEquals(node(0,2), uriAndLiteral.node());
    assertEquals(-1, uriAndLiteral.pos());
    assertTrue(uriAndLiteral.nextPosition());
    assertEquals(0, uriAndLiteral.pos());

    assertEndOfStream(uriAndLiteral);
  }

  /**
   * Skipping to an existing candidate lands exactly on it and leaves the node
   * and position cursors at their initial values.
   */
  @Test
  public void testSkipToEntity() throws Exception {
    final ArrayList<String> corpus = this.repeatedDocuments(
      "<http://renaud.delbru.fr/> . \"renaud delbru\" \"renaud delbru\" . ");
    this.addDocuments(corpus);

    final NodeTermScorer termScorer = (NodeTermScorer) this.getScorer(ntq("renaud"));
    assertTrue(termScorer.skipToCandidate(16));
    assertEquals(16, termScorer.doc());
    assertEquals(node(-1), termScorer.node());
    assertEquals(-1, termScorer.pos());
  }

  /**
   * Skipping to a target that is not a candidate moves on to the next
   * candidate; skipping beyond the last document ends the stream.
   */
  @Test
  public void testSkipToNonExistingDocument() throws Exception {
    final ArrayList<String> corpus = this.repeatedDocuments(
      "<http://renaud.delbru.fr/> . \"renaud delbru\" \"renaud delbru\" . ",
      "<aaa> . \"aaa\" \"aaa bbb\" . ");
    this.deleteAll();
    this.addDocuments(corpus);

    final NodeTermScorer termScorer = (NodeTermScorer) this.getScorer(ntq("renaud"));

    // 17 is not a candidate for the term: the scorer is expected on 18
    assertTrue(termScorer.skipToCandidate(17));
    assertEquals(18, termScorer.doc());
    assertEquals(node(-1), termScorer.node());

    assertTrue(termScorer.nextNode());
    assertEquals(node(0, 0), termScorer.node());
    assertEquals(-1, termScorer.pos());
    assertTrue(termScorer.nextPosition());
    assertEquals(0, termScorer.pos());

    assertFalse(termScorer.skipToCandidate(76));
    assertEndOfStream(termScorer);
  }

  /**
   * Same skipping scenario as above, combined with interval and level
   * constraints: the candidate document is always 18, while the constraint
   * decides whether a node is returned.
   */
  @Test
  public void testSkipToWithConstraint() throws Exception {
    final ArrayList<String> corpus = this.repeatedDocuments(
      "<http://renaud.delbru.fr/> . \"renaud delbru\" \"renaud delbru\" . ",
      "<aaa> . \"aaa\" \"aaa bbb\" . ");
    this.deleteAll();
    this.addDocuments(corpus);

    // bound (1,1) only: node (1,1) is returned, then the stream can be exhausted
    final NodeScorer bounded = this.getScorer(
      ntq("renaud").bound(1,1)
    );
    this.assertSkipFrom17LandsOn18(bounded);
    assertTrue(bounded.nextNode());
    assertEquals(node(1,1), bounded.node());
    assertFalse(bounded.skipToCandidate(76));
    assertEndOfStream(bounded);

    // bound (1,1) at level 2: node (1,1) is still returned
    final NodeScorer boundedLevelTwo = this.getScorer(
      ntq("renaud").bound(1,1).level(2)
    );
    this.assertSkipFrom17LandsOn18(boundedLevelTwo);
    assertTrue(boundedLevelTwo.nextNode());
    assertEquals(node(1,1), boundedLevelTwo.node());

    // bound (1,1) at level 1: no node is returned
    final NodeScorer boundedLevelOne = this.getScorer(
      ntq("renaud").bound(1,1).level(1)
    );
    this.assertSkipFrom17LandsOn18(boundedLevelOne);
    assertFalse(boundedLevelOne.nextNode());
    assertEquals(DocsAndNodesIterator.NO_MORE_NOD, boundedLevelOne.node());

    // bound (4,7): no node is returned
    final NodeScorer outOfRange = this.getScorer(
      ntq("renaud").bound(4,7)
    );
    this.assertSkipFrom17LandsOn18(outOfRange);
    assertFalse(outOfRange.nextNode());
    assertEquals(DocsAndNodesIterator.NO_MORE_NOD, outOfRange.node());
  }

  /** Scoring a node before the scorer has been advanced must throw. */
  @Test(expected=Exception.class)
  public void testInvalidScoreCall() throws IOException {
    this.addDocument("\"Renaud\" . ");

    final NodeScorer nodeScorer = this.getScorer(ntq("renaud"));
    // Invalid call: the scorer has not been moved to any document or node
    nodeScorer.scoreInNode();
  }

  /**
   * Through the Lucene proxy, the single document is matched with a frequency
   * of 3 and a score different from zero.
   */
  @Test
  public void testScore() throws IOException {
    this.addDocument("\"Renaud renaud\" \"renaud\" . ");

    final LuceneProxyNodeScorer proxy =
      new LuceneProxyNodeScorer(this.getScorer(ntq("renaud")));

    assertTrue(proxy.nextDoc() != DocsAndNodesIterator.NO_MORE_DOC);
    assertEquals(0, proxy.docID());
    assertEquals(3.0, proxy.freq(), 0.01);

    final float score = proxy.score();
    final String message = score + " != " + 0;
    assertFalse(message, score == 0);
  }

}