/* $Id$ */ /** * Licensed to the Apache Software Foundation (ASF) under one or more * contributor license agreements. See the NOTICE file distributed with * this work for additional information regarding copyright ownership. * The ASF licenses this file to You under the Apache License, Version 2.0 * (the "License"); you may not use this file except in compliance with * the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ package org.apache.manifoldcf.crawler.connectors.rss; /** Constants for the RSS connector configuration. */ public class RSSConfig { public static final String _rcsid = "@(#)$Id$"; // Constants describing the configuration structure. This structure describes the "how" of // fetching page data - e.g. bandwidth and fetch constraints, adherance to robots conventions, // etc. // For the throttling part of the connector, the scheduler handles average fetch-rate limits. // The per-connection configuration describes the maximum number of connections per some user-defined criteria, as // well as bandwidth maximums and fetch rate absolute maximums. // // Parameters /** Robots usage parameter */ public static final String PARAMETER_ROBOTSUSAGE = "Robots usage"; /** Email parameter */ public static final String PARAMETER_EMAIL = "Email address"; /** Max kilobytes per second per server */ public static final String PARAMETER_BANDWIDTH = "KB per second"; /** Max simultaneous open connections per server */ public static final String PARAMETER_MAXOPEN = "Max server connections"; /** Max fetches per minute per server */ public static final String PARAMETER_MAXFETCHES = "Max fetches per minute"; /** The throttle group name */ public static final String PARAMETER_THROTTLEGROUP = "Throttle group"; /** Proxy host name */ public static final String PARAMETER_PROXYHOST = "Proxy host"; /** Proxy port */ public static final String PARAMETER_PROXYPORT = "Proxy port"; /** Proxy auth domain */ public static final String PARAMETER_PROXYAUTHDOMAIN = "Proxy authentication domain"; /** Proxy auth username */ public static final String PARAMETER_PROXYAUTHUSERNAME = "Proxy authentication user name"; /** Proxy auth password */ public static final String PARAMETER_PROXYAUTHPASSWORD = "Proxy authentication password"; // Constants used in the document specification part of the configuration structure. // This describes the "what" of the job. /** Feed specification node. Has one attribute, 'url'. */ public static final String NODE_FEED = "feed"; /** Map entry specification node. Has two attributes: 'match' and 'map'. */ public static final String NODE_MAP = "map"; /** Feed timeout. Attribute = 'value' */ public static final String NODE_FEEDTIMEOUT = "feedtimeout"; /** Feed rescan time. Attribute = 'value' */ public static final String NODE_FEEDRESCAN = "feedrescan"; /** Min feed rescan time. Attribute = 'value' */ public static final String NODE_MINFEEDRESCAN = "minfeedrescan"; /** Bad feed rescan time. Attribute = 'value' */ public static final String NODE_BADFEEDRESCAN = "badfeedrescan"; /** Access node (forced ACLs). Attribute is 'token' */ public static final String NODE_ACCESS = "access"; /** Dechromed mode. Attribute is 'mode' */ public static final String NODE_DECHROMEDMODE = "dechromedmode"; /** Chromed mode. Attribute is 'mode' */ public static final String NODE_CHROMEDMODE = "chromedmode"; /** Url normalization specification; attrs are 'regexp', 'description', 'reorder', * 'javasessionremoval', 'aspsessionremoval', 'bvsessionremoval', 'phpsessionremoval' */ public static final String NODE_URLSPEC = "urlspec"; /** Exclude regexps node. The value of this node contains the regexps that * if any one matches, causes the URL to be excluded from the crawl. These * regexps are newline separated, and # starts a comment. */ public static final String NODE_EXCLUDES = "excludes"; // Attributes /** Url attribute */ public static final String ATTR_URL = "url"; /** Value attribute */ public static final String ATTR_VALUE = "value"; /** Name attribute */ public static final String ATTR_NAME = "name"; /** Token attribute */ public static final String ATTR_TOKEN = "token"; /** Mode attribute */ public static final String ATTR_MODE = "mode"; /** Regexp attribute */ public static final String ATTR_REGEXP = "regexp"; /** Description attribute */ public static final String ATTR_DESCRIPTION = "description"; /** Reorder attribute */ public static final String ATTR_REORDER = "reorder"; /** Javasessionremoval attribute */ public static final String ATTR_JAVASESSIONREMOVAL = "javasessionremoval"; /** Aspsessionremoval attribute */ public static final String ATTR_ASPSESSIONREMOVAL = "aspsessionremoval"; /** Phpsessionremoval attribute */ public static final String ATTR_PHPSESSIONREMOVAL = "phpsessionremoval"; /** Bvsessionremoval attribute */ public static final String ATTR_BVSESSIONREMOVAL = "bvsessionremoval"; /** Match attribute */ public static final String ATTR_MATCH = "match"; /** Map attribute */ public static final String ATTR_MAP = "map"; // Values // Robots usage values /** All */ public static final String VALUE_ALL = "all"; /** None */ public static final String VALUE_NONE = "none"; /** Data */ public static final String VALUE_DATA = "data"; // Dechromedmode mode values /** None */ //public static final String VALUE_NONE = "none"; /** Description */ public static final String VALUE_DESCRIPTION = "description"; /** Content */ public static final String VALUE_CONTENT = "content"; // Chromedmode mode values /** Use */ public static final String VALUE_USE = "use"; /** Skip */ public static final String VALUE_SKIP = "skip"; /** Metadata */ public static final String VALUE_METADATA = "metadata"; // Yes/no /** No */ public static final String VALUE_NO = "no"; /** Yes */ public static final String VALUE_YES = "yes"; }