package eu.europeana.cloud.service.dps.storm.transform.text.txt;
import eu.europeana.cloud.service.dps.storm.transform.text.MethodsEnumeration;
import eu.europeana.cloud.service.dps.storm.transform.text.TextExtractor;
import java.io.IOException;
import java.io.InputStream;
import java.util.Map;
import org.apache.commons.io.IOUtils;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
/**
* Text extractor for TXT files that only read the file.
* @author Pavel Kefurt <Pavel.Kefurt@gmail.com>
*/
public class ReadFileExtractor implements TextExtractor
{
private static final Logger LOGGER = LoggerFactory.getLogger(ReadFileExtractor.class);
@Override
public String extractText(InputStream is)
{
if(is == null)
{
return null;
}
try
{
return IOUtils.toString(is);
}
catch (IOException ex)
{
LOGGER.warn("Can not read text from txt file because: " + ex.getMessage());
return null;
}
}
@Override
public MethodsEnumeration getExtractionMethod()
{
return TxtExtractionMethods.READ_FILE_EXTRACTOR;
}
@Override
public Map<String, String> getExtractedMetadata()
{
return null;
}
@Override
public String getRepresentationName()
{
return "txt";
}
}