/**
* Copyright 2008 - 2009 Pro-Netics S.P.A.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package it.pronetics.madstore.crawler.impl;
import it.pronetics.madstore.crawler.Pipeline;
import it.pronetics.madstore.crawler.downloader.Downloader;
import it.pronetics.madstore.crawler.parser.Parser;
import it.pronetics.madstore.crawler.publisher.AtomPublisher;
/**
* Factory interface for creating specific {@link CrawlerTask} implementations.
*
* @author Sergio Bossa
*/
public interface CrawlerTaskFactory {
/**
* Make and configure a fresh crawler task instance.
*
* @param downloader The {@link it.pronetics.madstore.crawler.downloader.Downloader} to use for downloading web pages.
* @param parser The {@link it.pronetics.madstore.crawler.parser.Parser} to use for parsing web pages.
* @param publisher The {@link it.pronetics.madstore.crawler.publisher.AtomPublisher} to use for publishing Atom contents to repositories.
* @param pipeline The {@link it.pronetics.madstore.crawler.Pipeline} to use for processing web pages.
* @param maxConcurrentDownloads The max number of concurrent page downloads on a single target site.
* @param maxVisitedLinks The max number of visited links on a single target site.
* @return The crawler task instance.
*/
public CrawlerTask makeCrawlerTask(Downloader downloader, Parser parser, AtomPublisher publisher, Pipeline pipeline, int maxConcurrentDownloads, int maxVisitedLinks);
}