package uk.ac.shef.dcs.jate.io;

import uk.ac.shef.dcs.jate.JATEException;
import uk.ac.shef.dcs.jate.model.JATEDocument;

import java.io.File;

/**
 * A {@link DocumentCreator} that builds a {@link JATEDocument} from a file path,
 * obtaining the document text from a {@link ContentExtractor}.
 *
 * <p>NOTE(review): the class name suggests the extraction is backed by Apache Tika;
 * that is determined by {@code ContentExtractor}, which is defined elsewhere — confirm there.
 *
 * <p>Created by zqz on 15/09/2015.
 */
public class TikaSimpleDocumentCreator extends DocumentCreator {

    /** Extractor used to read the text of each source file. */
    protected ContentExtractor contentExtractor;

    /**
     * Creates a document creator with its own new {@link ContentExtractor}.
     */
    public TikaSimpleDocumentCreator() {
        this.contentExtractor = new ContentExtractor();
    }

    /**
     * Builds a document for the given source.
     *
     * <p>The {@code source} string is used three ways: as the argument to the
     * {@link JATEDocument} constructor, as the document path, and as the
     * pathname of the file handed to the content extractor.
     *
     * @param source pathname of the file to load
     * @return a new document whose path is {@code source} and whose content is
     *         whatever the extractor returned for that file
     * @throws JATEException declared by this method; presumably raised when
     *         content extraction fails — confirm against {@code ContentExtractor}
     */
    public JATEDocument create(String source) throws JATEException {
        // The File is built before the document, matching the original statement order.
        File sourceFile = new File(source);

        JATEDocument document = new JATEDocument(source);
        document.setPath(source);
        document.setContent(this.contentExtractor.extractContent(sourceFile));
        return document;
    }

    /**
     * Returns a brand-new creator of the same type.
     *
     * <p>The new instance is built through the no-argument constructor, so it
     * gets its own extractor rather than sharing this instance's.
     *
     * @return a fresh {@code TikaSimpleDocumentCreator}
     */
    @Override
    public DocumentCreator copy() {
        return new TikaSimpleDocumentCreator();
    }
}