/*
* (c) Copyright 2008-2011 by Volker Bergmann. All rights reserved.
*
* Redistribution and use in source and binary forms, with or without
* modification, is permitted under the terms of the
* GNU General Public License.
*
* For redistributing this software or a derivative work under a license other
* than the GPL-compatible Free Software License as defined by the Free
* Software Foundation or approved by OSI, you must first obtain a commercial
* license to this software product from Volker Bergmann.
*
* THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS "AS IS"
* WITHOUT A WARRANTY OF ANY KIND. ALL EXPRESS OR IMPLIED CONDITIONS,
* REPRESENTATIONS AND WARRANTIES, INCLUDING ANY IMPLIED WARRANTY OF
* MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE OR NON-INFRINGEMENT, ARE
* HEREBY EXCLUDED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR CONTRIBUTORS BE
* LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR
* CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF
* SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS
* INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN
* CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE)
* ARISING IN ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE
* POSSIBILITY OF SUCH DAMAGE.
*/
package org.databene.benerator.csv;
import java.util.List;
import org.databene.benerator.WeightedGenerator;
import org.databene.benerator.dataset.AbstractDatasetGenerator;
import org.databene.benerator.dataset.AtomicDatasetGenerator;
import org.databene.benerator.dataset.Dataset;
import org.databene.benerator.dataset.DatasetUtil;
import org.databene.benerator.sample.AttachedWeightSampleGenerator;
import org.databene.commons.Converter;
import org.databene.commons.IOUtil;
import org.databene.commons.SystemInfo;
import org.databene.commons.converter.NoOpConverter;
import org.databene.script.WeightedSample;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
/**
* Generates data from a csv file set that is organized as {@link Dataset}.
* For different regions, different CSV versions may be provided by appending region suffixes,
* similar to the JDK ResourceBundle handling.<br/>
* <br/>
* Created: 21.03.2008 16:32:04
* @since 0.5.0
* @author Volker Bergmann
*/
public class WeightedDatasetCSVGenerator<E> extends AbstractDatasetGenerator<E> {
private static final Logger LOGGER = LoggerFactory.getLogger(WeightedDatasetCSVGenerator.class);
protected String filenamePattern;
protected String encoding;
protected char separator;
protected Converter<String, E> converter;
// constructors ----------------------------------------------------------------------------------------------------
public WeightedDatasetCSVGenerator(Class<E> generatedType, String filenamePattern, String datasetName, String nesting, boolean fallback) {
this(generatedType, filenamePattern, ',', datasetName, nesting, fallback, SystemInfo.getFileEncoding());
}
@SuppressWarnings({ "unchecked", "cast", "rawtypes" })
public WeightedDatasetCSVGenerator(Class<E> generatedType, String filenamePattern, char separator, String datasetName, String nesting, boolean fallback, String encoding) {
this(generatedType, filenamePattern, separator, datasetName, nesting, fallback, encoding, (Converter<String, E>) new NoOpConverter());
}
@SuppressWarnings({ "cast", "unchecked", "rawtypes" })
public WeightedDatasetCSVGenerator(Class<E> generatedType, String filenamePattern, String datasetName, String nesting, boolean fallback, String encoding) {
this(generatedType, filenamePattern, ',', datasetName, nesting, fallback, encoding, (Converter<String, E>) new NoOpConverter());
}
public WeightedDatasetCSVGenerator(Class<E> generatedType, String filenamePattern, char separator, String datasetName, String nesting, boolean fallback,
String encoding, Converter<String, E> converter) {
super(generatedType, nesting, datasetName, fallback);
this.filenamePattern = filenamePattern;
this.separator = separator;
this.encoding = encoding;
this.converter = converter;
}
// properties ------------------------------------------------------------------------------------------------------
public void setFilenamePattern(String filenamePattern) {
this.filenamePattern = filenamePattern;
}
public String getFilenamePattern() {
return filenamePattern;
}
@Override
protected WeightedGenerator<E> createGeneratorForAtomicDataset(Dataset dataset) {
String filename = DatasetUtil.filenameOfDataset(dataset.getName(), filenamePattern);
LOGGER.debug("Creating weighted data set CSV generator for file {}", filename);
if (IOUtil.isURIAvailable(filename)) {
List<WeightedSample<E>> samples = CSVGeneratorUtil.parseFile(filename, separator, encoding, converter);
AttachedWeightSampleGenerator<E> generator = new AttachedWeightSampleGenerator<E>(generatedType);
for (WeightedSample<E> sample : samples)
generator.addSample(sample.getValue(), sample.getWeight());
if (samples.size() > 0)
return new AtomicDatasetGenerator<E>(generator, filename, dataset.getName());
}
return null;
}
// java.lang.Object overrides --------------------------------------------------------------------------------------
@Override
public String toString() {
return getClass().getSimpleName() + '[' + filenamePattern + ',' + nesting + ':' + datasetName + ']';
}
}