/**
* This package contains all classes that store information about a parsed document (e.g. extracted metadata) and its full text.
*/
package org.bbaw.wsp.cms.dochandler.parser.document;
import org.bbaw.wsp.cms.document.MetadataRecord;
import org.bbaw.wsp.cms.dochandler.parser.text.parser.ResourceParser;
/**
* This interface provides access to any kind of parsed document, i.e. a
* document that was previously parsed by the {@link ResourceParser}.
*
* @author Sascha Feldmann (wsp-shk1)
* @date 16.08.2012
*
*/
public interface IDocument {

  /**
   * Returns the full text of the parsed document.
   *
   * @return the full text as a String; never null.
   */
  String getTextOrig();

  /**
   * Returns the URL of the parsed document.
   *
   * @return the URL as a String; never null.
   */
  String getURL();

  /**
   * Returns the metadata of the parsed document.
   *
   * @return the {@link MetadataRecord}; may be null if no metadata has been
   *         set.
   */
  MetadataRecord getMetadata();

  /**
   * Sets the metadata of the parsed document.
   *
   * @param metadata
   *          the {@link MetadataRecord} to set.
   */
  void setMetadata(MetadataRecord metadata);
}