blob: 6a4c921a0a1708c623a7ca22327ac9a44e672eb2 [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.tika.pipes.fetcher;
import java.io.IOException;
import java.io.InputStream;
import java.nio.file.Files;
import java.nio.file.Path;
import java.util.List;
import java.util.Map;
import java.util.Set;
import java.util.concurrent.ConcurrentHashMap;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import org.apache.tika.config.ConfigBase;
import org.apache.tika.exception.TikaConfigException;
import org.apache.tika.exception.TikaException;
/**
* Utility class to hold multiple fetchers.
* <p>
* This forbids multiple fetchers supporting the same name.
*/
public class FetcherManager extends ConfigBase {
private static final Logger LOG = LoggerFactory.getLogger(FetcherManager.class);
public static FetcherManager load(Path p) throws IOException, TikaConfigException {
try (InputStream is =
Files.newInputStream(p)) {
return FetcherManager.buildComposite("fetchers", FetcherManager.class,
"fetcher", Fetcher.class, is);
}
}
private final Map<String, Fetcher> fetcherMap = new ConcurrentHashMap<>();
public FetcherManager(List<Fetcher> fetchers) throws TikaConfigException {
for (Fetcher fetcher : fetchers) {
String name = fetcher.getName();
if (name == null || name.trim().isEmpty()) {
throw new TikaConfigException("Fetcher name must not be blank");
}
if (fetcherMap.containsKey(fetcher.getName())) {
LOG.warn("Duplicate fetcher saved in the tika-config xml: {}. Ignoring.", fetcher.getName());
continue;
}
fetcherMap.put(fetcher.getName(), fetcher);
}
}
public Fetcher getFetcher(String fetcherName) throws IOException, TikaException {
Fetcher fetcher = fetcherMap.get(fetcherName);
if (fetcher == null) {
throw new IllegalArgumentException(
"Can't find fetcher for fetcherName: " + fetcherName + ". I've loaded: " +
fetcherMap.keySet());
}
return fetcher;
}
public Set<String> getSupported() {
return fetcherMap.keySet();
}
/**
* Convenience method that returns a fetcher if only one fetcher
* is specified in the tika-config file. If 0 or > 1 fetchers
* are specified, this throws an IllegalArgumentException.
* @return
*/
public Fetcher getFetcher() {
if (fetcherMap.size() == 0) {
throw new IllegalArgumentException("fetchers size must == 1 for the no arg call");
}
if (fetcherMap.size() > 1) {
throw new IllegalArgumentException("need to specify 'fetcherName' if > 1 fetchers are" +
" available");
}
for (Fetcher fetcher : fetcherMap.values()) {
return fetcher;
}
//this should be unreachable?!
throw new IllegalArgumentException("fetchers size must == 0");
}
}