blob: 50daa57fd0fdeadec1aba2fa4483a6a717ea52a3 [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.nutch.plugin;
import java.lang.invoke.MethodHandles;
import java.lang.reflect.Array;
import java.lang.reflect.Constructor;
import java.lang.reflect.InvocationTargetException;
import java.lang.reflect.Method;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.HashMap;
import java.util.WeakHashMap;
import java.util.List;
import java.util.Map;
import java.util.regex.Pattern;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import org.apache.hadoop.conf.Configuration;
import org.apache.nutch.util.NutchConfiguration;
import org.apache.nutch.util.ObjectCache;
/**
* The plugin repositority is a registry of all plugins.
*
* At system boot up a repositority is builded by parsing the mainifest files of
* all plugins. Plugins that require not existing other plugins are not
* registed. For each plugin a plugin descriptor instance will be created. The
* descriptor represents all meta information about a plugin. So a plugin
* instance will be created later when it is required, this allow lazy plugin
* loading.
*/
public class PluginRepository {
private static final WeakHashMap<String, PluginRepository> CACHE = new WeakHashMap<>();
private boolean auto;
private List<PluginDescriptor> fRegisteredPlugins;
private HashMap<String, ExtensionPoint> fExtensionPoints;
private HashMap<String, Plugin> fActivatedPlugins;
private static final Map<String, Map<PluginClassLoader, Class>> CLASS_CACHE = new HashMap<>();
private Configuration conf;
protected static final Logger LOG = LoggerFactory
.getLogger(MethodHandles.lookup().lookupClass());
/**
* @throws RuntimeException
* @see java.lang.Object#Object()
*/
public PluginRepository(Configuration conf) throws RuntimeException {
fActivatedPlugins = new HashMap<>();
fExtensionPoints = new HashMap<>();
this.conf = new Configuration(conf);
this.auto = conf.getBoolean("plugin.auto-activation", true);
String[] pluginFolders = conf.getStrings("plugin.folders");
PluginManifestParser manifestParser = new PluginManifestParser(this.conf,
this);
Map<String, PluginDescriptor> allPlugins = manifestParser
.parsePluginFolder(pluginFolders);
if (allPlugins.isEmpty()) {
LOG.warn("No plugins found on paths of property plugin.folders=\"{}\"",
conf.get("plugin.folders"));
}
Pattern excludes = Pattern.compile(conf.get("plugin.excludes", ""));
Pattern includes = Pattern.compile(conf.get("plugin.includes", ""));
Map<String, PluginDescriptor> filteredPlugins = filter(excludes, includes,
allPlugins);
fRegisteredPlugins = getDependencyCheckedPlugins(filteredPlugins,
this.auto ? allPlugins : filteredPlugins);
installExtensionPoints(fRegisteredPlugins);
try {
installExtensions(fRegisteredPlugins);
} catch (PluginRuntimeException e) {
LOG.error(e.toString());
throw new RuntimeException(e.getMessage());
}
displayStatus();
}
/**
* @return a cached instance of the plugin repository
*/
public static synchronized PluginRepository get(Configuration conf) {
String uuid = NutchConfiguration.getUUID(conf);
if (uuid == null) {
uuid = "nonNutchConf@" + conf.hashCode(); // fallback
}
PluginRepository result = CACHE.get(uuid);
if (result == null) {
result = new PluginRepository(conf);
CACHE.put(uuid, result);
}
return result;
}
private void installExtensionPoints(List<PluginDescriptor> plugins) {
if (plugins == null) {
return;
}
for (PluginDescriptor plugin : plugins) {
for (ExtensionPoint point : plugin.getExtenstionPoints()) {
String xpId = point.getId();
LOG.debug("Adding extension point " + xpId);
fExtensionPoints.put(xpId, point);
}
}
}
/**
* @param pRegisteredPlugins
*/
private void installExtensions(List<PluginDescriptor> pRegisteredPlugins)
throws PluginRuntimeException {
for (PluginDescriptor descriptor : pRegisteredPlugins) {
for (Extension extension : descriptor.getExtensions()) {
String xpId = extension.getTargetPoint();
ExtensionPoint point = getExtensionPoint(xpId);
if (point == null) {
throw new PluginRuntimeException("Plugin ("
+ descriptor.getPluginId() + "), " + "extension point: " + xpId
+ " does not exist.");
}
point.addExtension(extension);
}
}
}
private void getPluginCheckedDependencies(PluginDescriptor plugin,
Map<String, PluginDescriptor> plugins,
Map<String, PluginDescriptor> dependencies,
Map<String, PluginDescriptor> branch) throws MissingDependencyException,
CircularDependencyException {
if (dependencies == null) {
dependencies = new HashMap<>();
}
if (branch == null) {
branch = new HashMap<>();
}
branch.put(plugin.getPluginId(), plugin);
// Otherwise, checks each dependency
for (String id : plugin.getDependencies()) {
PluginDescriptor dependency = plugins.get(id);
if (dependency == null) {
throw new MissingDependencyException("Missing dependency " + id
+ " for plugin " + plugin.getPluginId());
}
if (branch.containsKey(id)) {
throw new CircularDependencyException("Circular dependency detected "
+ id + " for plugin " + plugin.getPluginId());
}
dependencies.put(id, dependency);
getPluginCheckedDependencies(plugins.get(id), plugins, dependencies,
branch);
}
branch.remove(plugin.getPluginId());
}
private Map<String, PluginDescriptor> getPluginCheckedDependencies(
PluginDescriptor plugin, Map<String, PluginDescriptor> plugins)
throws MissingDependencyException, CircularDependencyException {
Map<String, PluginDescriptor> dependencies = new HashMap<>();
Map<String, PluginDescriptor> branch = new HashMap<>();
getPluginCheckedDependencies(plugin, plugins, dependencies, branch);
return dependencies;
}
/**
* @param filtered
* is the list of plugin filtred
* @param all
* is the list of all plugins found.
* @return List
*/
private List<PluginDescriptor> getDependencyCheckedPlugins(
Map<String, PluginDescriptor> filtered, Map<String, PluginDescriptor> all) {
if (filtered == null) {
return null;
}
Map<String, PluginDescriptor> checked = new HashMap<>();
for (PluginDescriptor plugin : filtered.values()) {
try {
checked.putAll(getPluginCheckedDependencies(plugin, all));
checked.put(plugin.getPluginId(), plugin);
} catch (MissingDependencyException mde) {
// Logger exception and ignore plugin
LOG.warn(mde.getMessage());
} catch (CircularDependencyException cde) {
// Simply ignore this plugin
LOG.warn(cde.getMessage());
}
}
return new ArrayList<>(checked.values());
}
/**
* Returns all registed plugin descriptors.
*
* @return PluginDescriptor[]
*/
public PluginDescriptor[] getPluginDescriptors() {
return fRegisteredPlugins.toArray(new PluginDescriptor[fRegisteredPlugins
.size()]);
}
/**
* Returns the descriptor of one plugin identified by a plugin id.
*
* @param pPluginId
* @return PluginDescriptor
*/
public PluginDescriptor getPluginDescriptor(String pPluginId) {
for (PluginDescriptor descriptor : fRegisteredPlugins) {
if (descriptor.getPluginId().equals(pPluginId))
return descriptor;
}
return null;
}
/**
* Returns a extension point indentified by a extension point id.
*
* @param pXpId
* @return a extentsion point
*/
public ExtensionPoint getExtensionPoint(String pXpId) {
return this.fExtensionPoints.get(pXpId);
}
/**
* Returns a instance of a plugin. Plugin instances are cached. So a plugin
* exist only as one instance. This allow a central management of plugin own
* resources.
*
* After creating the plugin instance the startUp() method is invoked. The
* plugin use a own classloader that is used as well by all instance of
* extensions of the same plugin. This class loader use all exported libraries
* from the dependend plugins and all plugin libraries.
*
* @param pDescriptor
* @return Plugin
* @throws PluginRuntimeException
*/
public Plugin getPluginInstance(PluginDescriptor pDescriptor)
throws PluginRuntimeException {
if (fActivatedPlugins.containsKey(pDescriptor.getPluginId()))
return fActivatedPlugins.get(pDescriptor.getPluginId());
try {
// Must synchronize here to make sure creation and initialization
// of a plugin instance are done by one and only one thread.
// The same is in Extension.getExtensionInstance().
// Suggested by Stefan Groschupf <sg@media-style.com>
synchronized (pDescriptor) {
Class<?> pluginClass = getCachedClass(pDescriptor,
pDescriptor.getPluginClass());
Constructor<?> constructor = pluginClass.getConstructor(new Class<?>[] {
PluginDescriptor.class, Configuration.class });
Plugin plugin = (Plugin) constructor.newInstance(new Object[] {
pDescriptor, this.conf });
plugin.startUp();
fActivatedPlugins.put(pDescriptor.getPluginId(), plugin);
return plugin;
}
} catch (ClassNotFoundException e) {
throw new PluginRuntimeException(e);
} catch (InstantiationException e) {
throw new PluginRuntimeException(e);
} catch (IllegalAccessException e) {
throw new PluginRuntimeException(e);
} catch (NoSuchMethodException e) {
throw new PluginRuntimeException(e);
} catch (InvocationTargetException e) {
throw new PluginRuntimeException(e);
}
}
/*
* (non-Javadoc)
*
* @see java.lang.Object#finalize()
*/
public void finalize() throws Throwable {
shutDownActivatedPlugins();
}
/**
* Shuts down all plugins
*
* @throws PluginRuntimeException
*/
private void shutDownActivatedPlugins() throws PluginRuntimeException {
for (Plugin plugin : fActivatedPlugins.values()) {
plugin.shutDown();
}
}
public Class getCachedClass(PluginDescriptor pDescriptor, String className)
throws ClassNotFoundException {
Map<PluginClassLoader, Class> descMap = CLASS_CACHE.get(className);
if (descMap == null) {
descMap = new HashMap<>();
CLASS_CACHE.put(className, descMap);
}
PluginClassLoader loader = pDescriptor.getClassLoader();
Class clazz = descMap.get(loader);
if (clazz == null) {
clazz = loader.loadClass(className);
descMap.put(loader, clazz);
}
return clazz;
}
private void displayStatus() {
LOG.info("Plugin Auto-activation mode: [" + this.auto + "]");
LOG.info("Registered Plugins:");
if ((fRegisteredPlugins == null) || (fRegisteredPlugins.size() == 0)) {
LOG.info("\tNONE");
} else {
for (PluginDescriptor plugin : fRegisteredPlugins) {
LOG.info("\t" + plugin.getName() + " (" + plugin.getPluginId() + ")");
}
}
LOG.info("Registered Extension-Points:");
if ((fExtensionPoints == null) || (fExtensionPoints.size() == 0)) {
LOG.info("\tNONE");
} else {
for (ExtensionPoint ep : fExtensionPoints.values()) {
LOG.info("\t" + ep.getName() + " (" + ep.getId() + ")");
}
}
}
/**
* Filters a list of plugins. The list of plugins is filtered regarding the
* configuration properties <code>plugin.excludes</code> and
* <code>plugin.includes</code>.
*
* @param excludes
* @param includes
* @param plugins
* Map of plugins
* @return map of plugins matching the configuration
*/
private Map<String, PluginDescriptor> filter(Pattern excludes,
Pattern includes, Map<String, PluginDescriptor> plugins) {
Map<String, PluginDescriptor> map = new HashMap<>();
if (plugins == null) {
return map;
}
for (PluginDescriptor plugin : plugins.values()) {
if (plugin == null) {
continue;
}
String id = plugin.getPluginId();
if (id == null) {
continue;
}
if (!includes.matcher(id).matches()) {
LOG.debug("not including: " + id);
continue;
}
if (excludes.matcher(id).matches()) {
LOG.debug("excluding: " + id);
continue;
}
map.put(plugin.getPluginId(), plugin);
}
return map;
}
/**
* Get ordered list of plugins. Filter and normalization plugins are applied
* in a configurable "pipeline" order, e.g., if one plugin depends on the
* output of another plugin. This method loads the plugins in the order
* defined by orderProperty. If orderProperty is empty or unset, all active
* plugins of the given interface and extension point are loaded.
*
* @param clazz
* interface class implemented by required plugins
* @param xPointId
* extension point id of required plugins
* @param orderProperty
* property name defining plugin order
* @return array of plugin instances
*/
public synchronized Object[] getOrderedPlugins(Class<?> clazz,
String xPointId, String orderProperty) {
Object[] filters;
ObjectCache objectCache = ObjectCache.get(conf);
filters = (Object[]) objectCache.getObject(clazz.getName());
if (filters == null) {
String order = conf.get(orderProperty);
List<String> orderOfFilters = new ArrayList<>();
boolean userDefinedOrder = false;
if (order != null && !order.trim().isEmpty()) {
orderOfFilters = Arrays.asList(order.trim().split("\\s+"));
userDefinedOrder = true;
}
try {
ExtensionPoint point = PluginRepository.get(conf).getExtensionPoint(
xPointId);
if (point == null)
throw new RuntimeException(xPointId + " not found.");
Extension[] extensions = point.getExtensions();
HashMap<String, Object> filterMap = new HashMap<>();
for (int i = 0; i < extensions.length; i++) {
Extension extension = extensions[i];
Object filter = extension.getExtensionInstance();
if (!filterMap.containsKey(filter.getClass().getName())) {
filterMap.put(filter.getClass().getName(), filter);
if (!userDefinedOrder)
orderOfFilters.add(filter.getClass().getName());
}
}
List<Object> sorted = new ArrayList<>();
for (String orderedFilter : orderOfFilters) {
Object f = filterMap.get(orderedFilter);
if (f == null) {
LOG.error(clazz.getSimpleName() + " : " + orderedFilter
+ " declared in configuration property " + orderProperty
+ " but not found in an active plugin - ignoring.");
continue;
}
sorted.add(f);
}
Object[] filter = (Object[]) Array.newInstance(clazz, sorted.size());
for (int i = 0; i < sorted.size(); i++) {
filter[i] = sorted.get(i);
if (LOG.isTraceEnabled()) {
LOG.trace(clazz.getSimpleName() + " : filters[" + i + "] = "
+ filter[i].getClass());
}
}
objectCache.setObject(clazz.getName(), filter);
} catch (PluginRuntimeException e) {
throw new RuntimeException(e);
}
filters = (Object[]) objectCache.getObject(clazz.getName());
}
return filters;
}
/**
* Loads all necessary dependencies for a selected plugin, and then runs one
* of the classes' main() method.
*
* @param args
* plugin ID (needs to be activated in the configuration), and the
* class name. The rest of arguments is passed to the main method of
* the selected class.
* @throws Exception
*/
public static void main(String[] args) throws Exception {
if (args.length < 2) {
System.err
.println("Usage: PluginRepository pluginId className [arg1 arg2 ...]");
return;
}
Configuration conf = NutchConfiguration.create();
PluginRepository repo = new PluginRepository(conf);
// args[0] - plugin ID
PluginDescriptor d = repo.getPluginDescriptor(args[0]);
if (d == null) {
System.err.println("Plugin '" + args[0] + "' not present or inactive.");
return;
}
ClassLoader cl = d.getClassLoader();
// args[1] - class name
Class<?> clazz = null;
try {
clazz = Class.forName(args[1], true, cl);
} catch (Exception e) {
System.err.println("Could not load the class '" + args[1] + ": "
+ e.getMessage());
return;
}
Method m = null;
try {
m = clazz.getMethod("main", new Class<?>[] { args.getClass() });
} catch (Exception e) {
System.err.println("Could not find the 'main(String[])' method in class "
+ args[1] + ": " + e.getMessage());
return;
}
String[] subargs = new String[args.length - 2];
System.arraycopy(args, 2, subargs, 0, subargs.length);
m.invoke(null, new Object[] { subargs });
}
}