package com.idega.block.websearch.business; import java.io.InputStream; import java.util.List; /** * <p><code>ContentHandler</code> Interface for content handlers. </p> * This class is a part of the websearch webcrawler and search engine block. <br> * It is based on the <a href="http://lucene.apache.org">Lucene</a> java search engine from the Apache group and loosly <br> * from the work of David Duddleston of i2a.com.<br> * * @copyright Idega Software 2002 * @author <a href="mailto:eiki@idega.is">Eirikur Hrafnsson</a> */ public interface ContentHandler { /** * Return author */ public String getAuthor(); /** * Return categories (from META tags) */ public String getCategories(); /** * Return contents */ public String getContents(); /** * Return description (from META tags) */ public String getDescription(); /** * Return META HREF */ public String getHREF(); /** * Return keywords (from META tags) */ public String getKeywords(); /** * Return links */ public List getLinks(); /** * Return published date (from META tag) */ public long getPublished(); /** * Return description (from META tags) */ public boolean getRobotFollow(); /** * Return description (from META tags) */ public boolean getRobotIndex(); /** * Return page title */ public String getTitle(); /** * Parse Content. */ public void parse(InputStream in); }