FeedParser.java example

Explorer

NewsSpeakServer-master
- libs
- src
  - com
    - vn
      - newsspeak
        ArticleParser.java
        ArticleParserFactory.java
        ArticleServlet.java
        Email.java
        ExtractTextXMLHandler.java
        FeaturedSourcesServlet.java
        FeedDataStorePopulator.java
        FeedServlet.java
        MailHandlerServlet.java
        NewsSource.java
        PMF.java
        parsers
        CNNParser.java
        DailyBeastParser.java
        EconomicTimesParser.java
        EngadgetParser.java
        HuffPostParser.java
        IndiaTodayParser.java
        LATimesParser.java
        MashableParser.java
        NYDailyNewsParser.java
        NYTimesParser.java
        ReadWriteWebParser.java
        TOIParser.java
        TechCrunchParser.java
        TheHinduParser.java
        USATodayParser.java
        WSJParser.java
        WashPostParser.java

package it.sauronsoftware.feed4j;

import it.sauronsoftware.feed4j.bean.Feed;

import java.net.URL;

import org.dom4j.Document;
import org.dom4j.DocumentException;
import org.dom4j.io.SAXReader;

/**
 * The feed parser. It can parse RSS 1.0, RSS 2.0, Atom 0.3 and Atom 1.0.
 * 
 * @author Carlo Pelliccia
 */
public class FeedParser {

	/**
	 * Gets the feed from an URL and parses it.
	 * 
	 * @param url
	 *            The feed URL.
	 * @return A Feed object containing the information extracted from the feed.
	 * @throws FeedIOException
	 *             I/O error during conetnts retrieving.
	 * @throws FeedXMLParseException
	 *             The document retrieved is not valid XML.
	 * @throws UnsupportedFeedException
	 *             The XML retrieved does not represents a feed whose kind is
	 *             known by the parser.
	 */
	public static Feed parse(URL url) throws FeedIOException,
			FeedXMLParseException, UnsupportedFeedException {
		try {
			// Esegue il parsing iniziale del documento XML.
			SAXReader saxReader = new SAXReader();
			Document document = saxReader.read(url);
			// Cerca il modulo di interpretazione del feed.
			int code = FeedRecognizer.recognizeFeed(document);
			switch (code) {
			case FeedRecognizer.RSS_1_0:
				return TypeRSS_1_0.feed(url, document);
			case FeedRecognizer.RSS_2_0:
				return TypeRSS_2_0.feed(url, document);
			case FeedRecognizer.ATOM_0_3:
				return TypeAtom_0_3.feed(url, document);
			case FeedRecognizer.ATOM_1_0:
				return TypeAtom_1_0.feed(url, document);
			default:
				throw new UnsupportedFeedException();
			}
		} catch (DocumentException e) {
			throw new FeedXMLParseException(e);
		}
	}

}