/*
* This is eMonocot, a global online biodiversity information resource.
*
* Copyright © 2011–2015 The Board of Trustees of the Royal Botanic Gardens, Kew and The University of Oxford
*
* eMonocot is free software: you can redistribute it and/or modify it under the terms of the
* GNU Affero General Public License as published by the Free Software Foundation, either version 3
* of the License, or (at your option) any later version.
*
* eMonocot is distributed in the hope that it will be useful, but WITHOUT ANY WARRANTY; without even
* the implied warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
* GNU Affero General Public License for more details.
*
* The complete text of the GNU Affero General Public License is in the source repository as the file
* ‘COPYING’. It is also available from <http://www.gnu.org/licenses/>.
*/
package org.emonocot.job.dwc;
import static org.junit.Assert.assertEquals;
import static org.junit.Assert.assertNotNull;
import static org.junit.Assert.assertTrue;
import java.io.File;
import java.io.FileInputStream;
import java.util.ArrayList;
import java.util.Collection;
import java.util.HashMap;
import java.util.List;
import java.util.Map;
import java.util.UUID;
import java.util.zip.ZipEntry;
import java.util.zip.ZipInputStream;
import org.apache.solr.client.solrj.SolrServer;
import org.apache.solr.client.solrj.response.QueryResponse;
import org.apache.solr.common.SolrDocumentList;
import org.apache.solr.common.params.ModifiableSolrParams;
import org.emonocot.api.job.DarwinCorePropertyMap;
import org.emonocot.model.Taxon;
import org.emonocot.persistence.hibernate.SolrIndexingListener;
import org.gbif.dwc.terms.Term;
import org.gbif.dwc.terms.DwcTerm;
import org.gbif.dwc.terms.GbifTerm;
import org.hibernate.Session;
import org.hibernate.SessionFactory;
import org.hibernate.Transaction;
import org.junit.After;
import org.junit.Before;
import org.junit.Test;
import org.junit.runner.RunWith;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import org.springframework.batch.core.ExitStatus;
import org.springframework.batch.core.Job;
import org.springframework.batch.core.JobExecution;
import org.springframework.batch.core.JobParameter;
import org.springframework.batch.core.JobParameters;
import org.springframework.batch.core.configuration.JobLocator;
import org.springframework.batch.core.launch.JobLauncher;
import org.springframework.beans.factory.annotation.Autowired;
import org.springframework.beans.factory.annotation.Qualifier;
import org.springframework.test.annotation.DirtiesContext;
import org.springframework.test.annotation.DirtiesContext.ClassMode;
import org.springframework.test.context.ContextConfiguration;
import org.springframework.test.context.junit4.SpringJUnit4ClassRunner;
/**
* Integration test for the Darwin Core archive creation job, checking that both
* a facet-restricted download and a complete download produce a zip archive.
*
* @author jk00kg
*
*/
@RunWith(SpringJUnit4ClassRunner.class)
@ContextConfiguration({
"/META-INF/spring/batch/jobs/darwinCoreArchiveCreator.xml",
"/META-INF/spring/applicationContext-integration.xml",
"/META-INF/spring/applicationContext-test.xml" })
@DirtiesContext(classMode = ClassMode.AFTER_CLASS)
public class DwcaCreationIntegrationTest {
private static final Logger logger = LoggerFactory.getLogger(DwcaCreationIntegrationTest.class);
@Autowired
private JobLocator jobLocator;
@Autowired
@Qualifier("jobLauncher")
private JobLauncher jobLauncher;
@Autowired
private SessionFactory sessionFactory;
@Autowired
private SolrServer solrServer;
@Autowired
private SolrIndexingListener solrIndexingListener;
/**
* Empties the Solr index and re-indexes every persisted taxon before each test.
*
* @throws java.lang.Exception
*/
@Before
public void setUp() throws Exception {
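// Remove any documents left over from earlier tests so the index starts empty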
ModifiableSolrParams params = new ModifiableSolrParams();
params.add("q","*:*");
params.add("rows",new Integer(Integer.MAX_VALUE).toString());
params.add("df","id");
QueryResponse queryResponse = solrServer.query(params);
SolrDocumentList solrDocumentList = queryResponse.getResults();
List<String> documentsToDelete = new ArrayList<String>();
for(int i = 0; i < solrDocumentList.size(); i++) {
documentsToDelete.add(solrDocumentList.get(i).getFirstValue("id").toString());
}
if(!documentsToDelete.isEmpty()) {
logger.info("Deleting " + documentsToDelete.size());
solrServer.deleteById(documentsToDelete);
solrServer.commit(true,true);
}
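// Re-index every persisted Taxon so that the download job queries a Solr index consistent with the database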
Session session = sessionFactory.openSession();
Transaction tx = session.beginTransaction();
List<Taxon> taxa = session.createQuery("from Taxon as taxon").list();
solrIndexingListener.indexObjects(taxa);
logger.info("Indexing " + taxa.size());
tx.commit();
}
/**
* @throws java.lang.Exception
*/
@After
public void tearDown() throws Exception {
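// No per-test cleanup is needed; the application context is discarded after the class via @DirtiesContext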
}
/**
* Creates an archive restricted to the Araceae facet and checks its contents.
*
* @throws Exception
*/
@Test
public void testWriteSubsetArchive() throws Exception {
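// Build the job parameters: an empty query, facets restricting the download to Araceae taxa,
// and the Darwin Core / GBIF term sets requested for each file in the archive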
Map<String, JobParameter> parameters = new HashMap<String, JobParameter>();
parameters.put("download.query", new JobParameter(""));
parameters.put("download.selectedFacets", new JobParameter("taxon.family_ss=Araceae,base.class_s=org.emonocot.model.Taxon"));
parameters.put("download.taxon", new JobParameter(toParameter(DarwinCorePropertyMap.getConceptTerms(DwcTerm.Taxon))));
parameters.put("download.description", new JobParameter(toParameter(DarwinCorePropertyMap.getConceptTerms(GbifTerm.Description))));
parameters.put("download.image", new JobParameter(toParameter(DarwinCorePropertyMap.getConceptTerms(GbifTerm.Image))));
parameters.put("download.distribution", new JobParameter(toParameter(DarwinCorePropertyMap.getConceptTerms(GbifTerm.Distribution))));
parameters.put("download.reference", new JobParameter(toParameter(DarwinCorePropertyMap.getConceptTerms(GbifTerm.Reference))));
parameters.put("download.limit", new JobParameter(new Integer(Integer.MAX_VALUE).toString()));
parameters.put("download.file",new JobParameter(UUID.randomUUID().toString()));
parameters.put("download.fieldsEnclosedBy", new JobParameter("\""));
parameters.put("download.fieldsTerminatedBy", new JobParameter("\t"));
JobParameters jobParameters = new JobParameters(parameters);
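// Look up the registered "DarwinCoreArchiveCreation" job and launch it with the parameters above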
Job archiveCreatorJob = jobLocator.getJob("DarwinCoreArchiveCreation");
assertNotNull("archiveCreatorJob must exist", archiveCreatorJob);
JobExecution jobExecution = jobLauncher.run(archiveCreatorJob,
jobParameters);
assertEquals("The Job should be sucessful", ExitStatus.COMPLETED, jobExecution.getExitStatus());
File workingDirectory = new File("target/output");
File outputFile = new File(workingDirectory,jobParameters.getParameters()
.get("download.file").getValue().toString() + ".zip");
assertTrue("There should be an output file", outputFile.exists());
ZipInputStream zipStream = new ZipInputStream(new FileInputStream(outputFile));
logger.info("Zip file created at " + outputFile.getAbsolutePath());
List<ZipEntry> entries = new ArrayList<ZipEntry>();
ZipEntry e;
while((e = zipStream.getNextEntry()) != null){
entries.add(e);
}
zipStream.close();
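// Seven entries are expected in the finished archive; the exact composition (the meta.xml descriptor,
// dataset metadata and the requested data files) depends on the job configuration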
assertEquals("There should be 7 files", 7, entries.size());
}
/**
* Creates an archive of all taxa and checks its contents.
*
* @throws Exception
*/
@Test
public void testWriteAllArchive() throws Exception {
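// Same parameters as the subset test, but the only facet restricts results to Taxon objects,
// so every taxon is included in the download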
Map<String, JobParameter> parameters = new HashMap<String, JobParameter>();
parameters.put("download.query", new JobParameter(""));
parameters.put("download.selectedFacets", new JobParameter("base.class_s=org.emonocot.model.Taxon"));
parameters.put("download.taxon", new JobParameter(toParameter(DarwinCorePropertyMap.getConceptTerms(DwcTerm.Taxon))));
parameters.put("download.description", new JobParameter(toParameter(DarwinCorePropertyMap.getConceptTerms(GbifTerm.Description))));
parameters.put("download.image", new JobParameter(toParameter(DarwinCorePropertyMap.getConceptTerms(GbifTerm.Image))));
parameters.put("download.distribution", new JobParameter(toParameter(DarwinCorePropertyMap.getConceptTerms(GbifTerm.Distribution))));
parameters.put("download.reference", new JobParameter(toParameter(DarwinCorePropertyMap.getConceptTerms(GbifTerm.Reference))));
parameters.put("download.file",new JobParameter(UUID.randomUUID().toString()));
parameters.put("download.limit", new JobParameter(new Integer(Integer.MAX_VALUE).toString()));
parameters.put("download.fieldsEnclosedBy", new JobParameter("\""));
parameters.put("download.fieldsTerminatedBy", new JobParameter("\t"));
JobParameters jobParameters = new JobParameters(parameters);
Job archiveCreatorJob = jobLocator.getJob("DarwinCoreArchiveCreation");
assertNotNull("archiveCreatorJob must exist", archiveCreatorJob);
JobExecution jobExecution = jobLauncher.run(archiveCreatorJob,
jobParameters);
assertEquals("The Job should be sucessful", ExitStatus.COMPLETED, jobExecution.getExitStatus());
File workingDirectory = new File("target/output");
File outputFile = new File(workingDirectory,jobParameters.getParameters()
.get("download.file").getValue().toString() + ".zip");
assertTrue("There should be an output file", outputFile.exists());
ZipInputStream zipStream = new ZipInputStream(new FileInputStream(outputFile));
logger.info("Zip file created at " + outputFile.getAbsolutePath());
List<ZipEntry> entries = new ArrayList<ZipEntry>();
ZipEntry e;
while((e = zipStream.getNextEntry()) != null){
entries.add(e);
}
zipStream.close();
assertEquals("There should be 7 files", 7, entries.size());
}
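/**
* Joins the qualified names of the given terms into a single comma-separated
* string suitable for use as a job parameter value.
*/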
private String toParameter(Collection<Term> terms) {
StringBuffer stringBuffer = new StringBuffer();
if (terms != null && !terms.isEmpty()) {
boolean isFirst = true;
for (Term term : terms) {
if(!isFirst) {
stringBuffer.append(",");
} else {
isFirst = false;
}
stringBuffer.append(term.qualifiedName());
}
}
return stringBuffer.toString();
}
}