/**
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.nutchbase.protocol;
import java.net.URL;
import java.net.MalformedURLException;
import java.util.HashSet;
import java.util.Set;
// Commons Logging imports
import org.apache.commons.logging.Log;
import org.apache.commons.logging.LogFactory;
import org.apache.nutch.plugin.*;
import org.apache.nutch.protocol.ProtocolNotFound;
import org.apache.nutch.util.ObjectCache;
import org.apache.hadoop.conf.Configuration;
/**
* Creates and caches {@link Protocol} plugins. Protocol plugins should define
* the attribute "protocolName" with the name of the protocol that they
* implement. Configuration object is used for caching. Cache key is constructed
* from appending protocol name (eg. http) to constant
* {@link Protocol#X_POINT_ID}.
*/
public class ProtocolFactoryHbase {
public static final Log LOG = LogFactory.getLog(ProtocolFactoryHbase.class);
private ExtensionPoint extensionPoint;
private Configuration conf;
public ProtocolFactoryHbase(Configuration conf) {
this.conf = conf;
this.extensionPoint = PluginRepository.get(conf).getExtensionPoint(
ProtocolHbase.X_POINT_ID);
if (this.extensionPoint == null) {
throw new RuntimeException("x-point " + ProtocolHbase.X_POINT_ID
+ " not found.");
}
}
/**
* Returns the appropriate {@link Protocol} implementation for a url.
*
* @param urlString
* Url String
* @return The appropriate {@link Protocol} implementation for a given {@link URL}.
* @throws ProtocolNotFound
* when Protocol can not be found for urlString
*/
public ProtocolHbase getProtocol(String urlString) throws ProtocolNotFound {
ObjectCache objectCache = ObjectCache.get(conf);
try {
URL url = new URL(urlString);
String protocolName = url.getProtocol();
String cacheId = ProtocolHbase.X_POINT_ID + protocolName;
if (protocolName == null)
throw new ProtocolNotFound(urlString);
if (objectCache.getObject(cacheId) != null) {
return (ProtocolHbase) objectCache.getObject(cacheId);
} else {
Extension extension = findExtension(protocolName);
if (extension == null) {
throw new ProtocolNotFound(protocolName);
}
ProtocolHbase protocol = (ProtocolHbase) extension.getExtensionInstance();
objectCache.setObject(cacheId, protocol);
return protocol;
}
} catch (MalformedURLException e) {
throw new ProtocolNotFound(urlString, e.toString());
} catch (PluginRuntimeException e) {
throw new ProtocolNotFound(urlString, e.toString());
}
}
private Extension findExtension(String name) throws PluginRuntimeException {
Extension[] extensions = this.extensionPoint.getExtensions();
for (int i = 0; i < extensions.length; i++) {
Extension extension = extensions[i];
if (contains(name, extension.getAttribute("protocolName")))
return extension;
}
return null;
}
boolean contains(String what, String where){
String parts[]=where.split("[, ]");
for(int i=0;i<parts.length;i++) {
if(parts[i].equals(what)) return true;
}
return false;
}
public Set<String> getColumnSet() {
Set<String> columnSet = new HashSet<String>();
for (Extension extension : this.extensionPoint.getExtensions()) {
ProtocolHbase protocol;
try {
protocol = (ProtocolHbase) extension.getExtensionInstance();
columnSet.addAll(protocol.getColumnSet());
} catch (PluginRuntimeException e) {
// ignore
}
}
return columnSet;
}
}