/* * Seldon -- open source prediction engine * ======================================= * Copyright 2011-2015 Seldon Technologies Ltd and Rummble Ltd (http://www.seldon.io/) * ********************************************************************************************** * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. * ********************************************************************************************** */ package io.seldon.importer.articles.dynamicextractors; import static org.easymock.EasyMock.*; import static org.junit.Assert.assertEquals; import static org.junit.Assert.assertNull; import io.seldon.importer.articles.dynamicextractors.AttributeDetail; import io.seldon.importer.articles.dynamicextractors.MultiSelectorDynamicExtractor; import io.seldon.importer.articles.dynamicextractors.AttributeDetail.SubExtractor; import java.util.ArrayList; import java.util.Arrays; import org.jsoup.nodes.Document; import org.jsoup.nodes.Element; import org.jsoup.select.Elements; import org.junit.Test; public class TestMultiSelectorDynamicExtractor { @Test public void shouldFailIfNoSelectorsMatch() throws Exception{ Document document = createMock(Document.class); MultiSelectorDynamicExtractor extr = new MultiSelectorDynamicExtractor(); AttributeDetail attrDetail = new AttributeDetail(); attrDetail.sub_types = new ArrayList<SubExtractor>(); assertNull(extr.extract(attrDetail, null, document)); replay(document); verify(document); } @Test public void shouldOnlyRunFirstExtractorIfItGetsAMatch() throws Exception { Document document = createMock(Document.class); Elements elements = createMock(Elements.class); Element element = createMock(Element.class); MultiSelectorDynamicExtractor extr = new MultiSelectorDynamicExtractor(); AttributeDetail attrDetail = new AttributeDetail(); SubExtractor extr1 = new SubExtractor(); SubExtractor extr2 = new SubExtractor(); extr1.extractor_type = "FirstElementTextValue"; extr1.extractor_args = Arrays.asList("selector"); extr2.extractor_type = "FirstElementTextValue"; extr2.extractor_args = Arrays.asList("selector2"); attrDetail.sub_types = Arrays.asList(extr1, extr2); expect(document.select("selector")).andReturn(elements); expect(elements.first()).andReturn(element); expect(element.text()).andReturn("notEmpty"); replay(document, elements, element); assertEquals("notEmpty",extr.extract(attrDetail, null, document)); verify(document, elements, element); } @Test public void shouldRunSecondExtractorIfFirstDoesntMatch() throws Exception { Document document = createMock(Document.class); Elements elements = createMock(Elements.class); Element element = createMock(Element.class); Elements elements2 = createMock(Elements.class); Element element2 = createMock(Element.class); MultiSelectorDynamicExtractor extr = new MultiSelectorDynamicExtractor(); AttributeDetail attrDetail = new AttributeDetail(); SubExtractor extr1 = new SubExtractor(); SubExtractor extr2 = new SubExtractor(); extr1.extractor_type = "FirstElementTextValue"; extr1.extractor_args = Arrays.asList("selector"); extr2.extractor_type = "FirstElementTextValue"; extr2.extractor_args = Arrays.asList("selector2"); attrDetail.sub_types = Arrays.asList(extr1, extr2); expect(document.select("selector")).andReturn(elements); expect(elements.first()).andReturn(element); expect(element.text()).andReturn(""); expect(document.select("selector2")).andReturn(elements2); expect(elements2.first()).andReturn(element2); expect(element2.text()).andReturn("notEmpty"); replay(document, elements, element, elements2, element2); assertEquals("notEmpty",extr.extract(attrDetail, null, document)); verify(document, elements, element, elements2, element2); } }