/**
* Copyright 2008 The University of North Carolina at Chapel Hill
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package edu.unc.lib.dl.data.ingest.solr.filter;
import static edu.unc.lib.dl.data.ingest.solr.filter.SetDescriptiveMetadataFilter.AFFIL_URI;
import static edu.unc.lib.dl.test.TestHelpers.setField;
import static org.junit.Assert.assertEquals;
import static org.junit.Assert.assertNotNull;
import static org.junit.Assert.assertNull;
import static org.junit.Assert.assertTrue;
import static org.mockito.Matchers.any;
import static org.mockito.Mockito.when;
import static org.mockito.MockitoAnnotations.initMocks;
import java.io.File;
import java.io.FileInputStream;
import java.util.Arrays;
import java.util.HashMap;
import java.util.List;
import java.util.Map;
import org.jdom2.Document;
import org.jdom2.Element;
import org.jdom2.input.SAXBuilder;
import org.junit.Before;
import org.junit.Test;
import org.mockito.Mock;
import edu.unc.lib.dl.data.ingest.solr.indexing.DocumentIndexingPackage;
import edu.unc.lib.dl.data.ingest.solr.indexing.DocumentIndexingPackageDataLoader;
import edu.unc.lib.dl.data.ingest.solr.indexing.DocumentIndexingPackageFactory;
import edu.unc.lib.dl.fedora.PID;
import edu.unc.lib.dl.search.solr.model.IndexDocumentBean;
import edu.unc.lib.dl.util.ContentModelHelper.Datastream;
import edu.unc.lib.dl.util.ContentModelHelper.FedoraProperty;
import edu.unc.lib.dl.util.DateTimeUtil;
import edu.unc.lib.dl.util.VocabularyHelperManager;
import edu.unc.lib.dl.xml.FOXMLJDOMUtil;
public class SetDescriptiveMetadataFilterTest {
@Mock
private DocumentIndexingPackageDataLoader loader;
private DocumentIndexingPackageFactory factory;
@Mock
private VocabularyHelperManager vocabManager;
private SetDescriptiveMetadataFilter filter;
Map<String, List<String>> triples;
@Before
public void setup() throws Exception {
initMocks(this);
filter = new SetDescriptiveMetadataFilter();
setField(filter, "vocabManager", vocabManager);
factory = new DocumentIndexingPackageFactory();
factory.setDataLoader(loader);
triples = new HashMap<>();
triples.put(FedoraProperty.label.toString(), Arrays.asList("Label"));
when(loader.loadTriples(any(DocumentIndexingPackage.class))).thenReturn(triples);
}
@Test
public void extractMODS() throws Exception {
DocumentIndexingPackage dip = factory.createDip("uuid:aggregate");
SAXBuilder builder = new SAXBuilder();
Document foxml = builder.build(new FileInputStream(new File(
"src/test/resources/foxml/aggregateSplitDepartments.xml")));
Element mods = FOXMLJDOMUtil.getDatastreamContent(Datastream.MD_DESCRIPTIVE, foxml);
when(loader.loadMDDescriptive(any(DocumentIndexingPackage.class))).thenReturn(mods);
Map<String, List<List<String>>> terms = new HashMap<>();
terms.put(AFFIL_URI, Arrays.asList(Arrays.asList("Department of Biostatistics")));
when(vocabManager.getAuthoritativeForms(any(PID.class), any(Element.class))).thenReturn(terms);
filter.filter(dip);
IndexDocumentBean idb = dip.getDocument();
assertEquals("Judson, Richard", idb.getCreatorSort());
assertEquals(4, idb.getCreator().size());
assertEquals(5, idb.getContributor().size());
assertEquals(1, idb.getDepartment().size());
assertEquals("Department of Biostatistics", idb.getDepartment().get(0));
assertNotNull(idb.getAbstractText());
assertEquals(
"A Comparison of Machine Learning Algorithms for Chemical Toxicity Classification Using a Simulated Multi-Scale Data Model",
idb.getTitle());
assertEquals(1, idb.getOtherTitle().size());
assertEquals("BMC Bioinformatics. 2008 May 19;9(1):241", idb.getCitation());
assertEquals("English", idb.getLanguage().get(0));
assertEquals(DateTimeUtil.parseUTCToDate("2008-05-19T00:00:00.000"), idb.getDateCreated());
assertTrue(idb.getIdentifier().contains("pmpid|18489778"));
assertTrue(idb.getIdentifier().contains("doi|10.1186/1471-2105-9-241"));
assertTrue(idb.getKeyword().contains("text"));
assertTrue(idb.getKeyword().contains("Peer Reviewed"));
assertTrue(idb.getKeyword().contains("2008"));
assertTrue(idb.getSubject().contains("Machine Learning"));
assertEquals(1, idb.getSubject().size());
}
@Test
public void noMODS() throws Exception {
DocumentIndexingPackage dip = factory.createDip("uuid:item");
filter.filter(dip);
IndexDocumentBean idb = dip.getDocument();
assertNull(idb.getCreator());
assertNull(idb.getContributor());
assertNull(idb.getDepartment());
assertNull(idb.getSubject());
assertNull(idb.getIdentifier());
assertNull(idb.getAbstractText());
assertEquals(idb.getId(), dip.getPid().getPid());
assertEquals("Label", idb.getTitle());
}
}