| /** |
| * Licensed to the Apache Software Foundation (ASF) under one |
| * or more contributor license agreements. See the NOTICE file |
| * distributed with this work for additional information |
| * regarding copyright ownership. The ASF licenses this file |
| * to you under the Apache License, Version 2.0 (the |
| * "License"); you may not use this file except in compliance |
| * with the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| package org.apache.hadoop.hbase.wal; |
| |
| import static org.apache.hadoop.hbase.wal.AbstractFSWALProvider.getWALArchiveDirectoryName; |
| import static org.apache.hadoop.hbase.wal.AbstractFSWALProvider.getWALDirectoryName; |
| |
| import java.io.IOException; |
| import java.lang.reflect.Constructor; |
| import java.lang.reflect.InvocationTargetException; |
| import java.util.ArrayList; |
| import java.util.List; |
| import java.util.Optional; |
| import java.util.concurrent.ConcurrentHashMap; |
| import java.util.concurrent.ConcurrentMap; |
| import java.util.concurrent.atomic.AtomicBoolean; |
| import java.util.concurrent.locks.Lock; |
| import java.util.function.BiPredicate; |
| import java.util.regex.Matcher; |
| import java.util.regex.Pattern; |
| import java.util.stream.Collectors; |
| import java.util.stream.Stream; |
| import org.apache.hadoop.conf.Configuration; |
| import org.apache.hadoop.hbase.Abortable; |
| import org.apache.hadoop.hbase.TableName; |
| import org.apache.hadoop.hbase.client.RegionInfo; |
| import org.apache.hadoop.hbase.regionserver.wal.DualAsyncFSWAL; |
| import org.apache.hadoop.hbase.regionserver.wal.WALActionsListener; |
| import org.apache.hadoop.hbase.replication.ReplicationUtils; |
| import org.apache.hadoop.hbase.replication.SyncReplicationState; |
| import org.apache.hadoop.hbase.replication.regionserver.PeerActionListener; |
| import org.apache.hadoop.hbase.replication.regionserver.SyncReplicationPeerInfoProvider; |
| import org.apache.hadoop.hbase.util.CommonFSUtils; |
| import org.apache.hadoop.hbase.util.EnvironmentEdgeManager; |
| import org.apache.hadoop.hbase.util.KeyLocker; |
| import org.apache.hadoop.hbase.util.Pair; |
| import org.apache.yetus.audience.InterfaceAudience; |
| import org.slf4j.Logger; |
| import org.slf4j.LoggerFactory; |
| |
| import org.apache.hbase.thirdparty.com.google.common.base.Throwables; |
| import org.apache.hbase.thirdparty.com.google.common.collect.Streams; |
| import org.apache.hbase.thirdparty.io.netty.channel.Channel; |
| import org.apache.hbase.thirdparty.io.netty.channel.EventLoopGroup; |
| |
| /** |
| * The special {@link WALProvider} for synchronous replication. |
| * <p> |
| * It works like an interceptor, when getting WAL, first it will check if the given region should be |
| * replicated synchronously, if so it will return a special WAL for it, otherwise it will delegate |
| * the request to the normal {@link WALProvider}. |
| */ |
| @InterfaceAudience.Private |
| public class SyncReplicationWALProvider implements WALProvider, PeerActionListener { |
| |
| private static final Logger LOG = LoggerFactory.getLogger(SyncReplicationWALProvider.class); |
| |
| // only for injecting errors for testcase, do not use it for other purpose. |
| public static final String DUAL_WAL_IMPL = "hbase.wal.sync.impl"; |
| |
| private final WALProvider provider; |
| |
| private SyncReplicationPeerInfoProvider peerInfoProvider = |
| new DefaultSyncReplicationPeerInfoProvider(); |
| |
| private WALFactory factory; |
| |
| private Configuration conf; |
| |
| private List<WALActionsListener> listeners = new ArrayList<>(); |
| |
| private EventLoopGroup eventLoopGroup; |
| |
| private Class<? extends Channel> channelClass; |
| |
| private AtomicBoolean initialized = new AtomicBoolean(false); |
| |
| // when switching from A to DA, we will put a Optional.empty into this map if there is no WAL for |
| // the peer yet. When getting WAL from this map the caller should know that it should not use |
| // DualAsyncFSWAL any more. |
| private final ConcurrentMap<String, Optional<DualAsyncFSWAL>> peerId2WAL = |
| new ConcurrentHashMap<>(); |
| |
| private final KeyLocker<String> createLock = new KeyLocker<>(); |
| |
| SyncReplicationWALProvider(WALProvider provider) { |
| this.provider = provider; |
| } |
| |
| public void setPeerInfoProvider(SyncReplicationPeerInfoProvider peerInfoProvider) { |
| this.peerInfoProvider = peerInfoProvider; |
| } |
| |
| @Override |
| public void init(WALFactory factory, Configuration conf, String providerId, Abortable abortable) |
| throws IOException { |
| if (!initialized.compareAndSet(false, true)) { |
| throw new IllegalStateException("WALProvider.init should only be called once."); |
| } |
| provider.init(factory, conf, providerId, abortable); |
| this.conf = conf; |
| this.factory = factory; |
| Pair<EventLoopGroup, Class<? extends Channel>> eventLoopGroupAndChannelClass = |
| NettyAsyncFSWALConfigHelper.getEventLoopConfig(conf); |
| eventLoopGroup = eventLoopGroupAndChannelClass.getFirst(); |
| channelClass = eventLoopGroupAndChannelClass.getSecond(); |
| } |
| |
| // Use a timestamp to make it identical. That means, after we transit the peer to DA/S and then |
| // back to A, the log prefix will be changed. This is used to simplify the implementation for |
| // replication source, where we do not need to consider that a terminated shipper could be added |
| // back. |
| private String getLogPrefix(String peerId) { |
| return factory.factoryId + "-" + EnvironmentEdgeManager.currentTime() + "-" + peerId; |
| } |
| |
| private DualAsyncFSWAL createWAL(String peerId, String remoteWALDir) throws IOException { |
| Class<? extends DualAsyncFSWAL> clazz = |
| conf.getClass(DUAL_WAL_IMPL, DualAsyncFSWAL.class, DualAsyncFSWAL.class); |
| try { |
| Constructor<?> constructor = null; |
| for (Constructor<?> c : clazz.getDeclaredConstructors()) { |
| if (c.getParameterCount() > 0) { |
| constructor = c; |
| break; |
| } |
| } |
| if (constructor == null) { |
| throw new IllegalArgumentException("No valid constructor provided for class " + clazz); |
| } |
| constructor.setAccessible(true); |
| return (DualAsyncFSWAL) constructor.newInstance( |
| CommonFSUtils.getWALFileSystem(conf), |
| ReplicationUtils.getRemoteWALFileSystem(conf, remoteWALDir), |
| CommonFSUtils.getWALRootDir(conf), |
| ReplicationUtils.getPeerRemoteWALDir(remoteWALDir, peerId), |
| getWALDirectoryName(factory.factoryId), getWALArchiveDirectoryName(conf, factory.factoryId), |
| conf, listeners, true, getLogPrefix(peerId), ReplicationUtils.SYNC_WAL_SUFFIX, |
| eventLoopGroup, channelClass); |
| } catch (InstantiationException | IllegalAccessException e) { |
| throw new RuntimeException(e); |
| } catch (InvocationTargetException e) { |
| Throwable cause = e.getTargetException(); |
| Throwables.propagateIfPossible(cause, IOException.class); |
| throw new RuntimeException(cause); |
| } |
| } |
| |
| private DualAsyncFSWAL getWAL(String peerId, String remoteWALDir) throws IOException { |
| Optional<DualAsyncFSWAL> opt = peerId2WAL.get(peerId); |
| if (opt != null) { |
| return opt.orElse(null); |
| } |
| Lock lock = createLock.acquireLock(peerId); |
| try { |
| opt = peerId2WAL.get(peerId); |
| if (opt != null) { |
| return opt.orElse(null); |
| } |
| DualAsyncFSWAL wal = createWAL(peerId, remoteWALDir); |
| boolean succ = false; |
| try { |
| wal.init(); |
| succ = true; |
| } finally { |
| if (!succ) { |
| wal.close(); |
| } |
| } |
| peerId2WAL.put(peerId, Optional.of(wal)); |
| return wal; |
| } finally { |
| lock.unlock(); |
| } |
| } |
| |
| @Override |
| public WAL getWAL(RegionInfo region) throws IOException { |
| if (region == null) { |
| return provider.getWAL(null); |
| } |
| WAL wal = null; |
| Optional<Pair<String, String>> peerIdAndRemoteWALDir = |
| peerInfoProvider.getPeerIdAndRemoteWALDir(region.getTable()); |
| if (peerIdAndRemoteWALDir.isPresent()) { |
| Pair<String, String> pair = peerIdAndRemoteWALDir.get(); |
| wal = getWAL(pair.getFirst(), pair.getSecond()); |
| } |
| return wal != null ? wal : provider.getWAL(region); |
| } |
| |
| private Stream<WAL> getWALStream() { |
| return Streams.concat( |
| peerId2WAL.values().stream().filter(Optional::isPresent).map(Optional::get), |
| provider.getWALs().stream()); |
| } |
| |
| @Override |
| public List<WAL> getWALs() { |
| return getWALStream().collect(Collectors.toList()); |
| } |
| |
| @Override |
| public void shutdown() throws IOException { |
| // save the last exception and rethrow |
| IOException failure = null; |
| for (Optional<DualAsyncFSWAL> wal : peerId2WAL.values()) { |
| if (wal.isPresent()) { |
| try { |
| wal.get().shutdown(); |
| } catch (IOException e) { |
| LOG.error("Shutdown WAL failed", e); |
| failure = e; |
| } |
| } |
| } |
| provider.shutdown(); |
| if (failure != null) { |
| throw failure; |
| } |
| } |
| |
| @Override |
| public void close() throws IOException { |
| // save the last exception and rethrow |
| IOException failure = null; |
| for (Optional<DualAsyncFSWAL> wal : peerId2WAL.values()) { |
| if (wal.isPresent()) { |
| try { |
| wal.get().close(); |
| } catch (IOException e) { |
| LOG.error("Close WAL failed", e); |
| failure = e; |
| } |
| } |
| } |
| provider.close(); |
| if (failure != null) { |
| throw failure; |
| } |
| } |
| |
| @Override |
| public long getNumLogFiles() { |
| return peerId2WAL.size() + provider.getNumLogFiles(); |
| } |
| |
| @Override |
| public long getLogFileSize() { |
| return peerId2WAL.values().stream().filter(Optional::isPresent).map(Optional::get) |
| .mapToLong(DualAsyncFSWAL::getLogFileSize).sum() + provider.getLogFileSize(); |
| } |
| |
| private void safeClose(WAL wal) { |
| if (wal != null) { |
| try { |
| wal.close(); |
| } catch (IOException e) { |
| LOG.error("Close WAL failed", e); |
| } |
| } |
| } |
| |
| @Override |
| public void addWALActionsListener(WALActionsListener listener) { |
| listeners.add(listener); |
| provider.addWALActionsListener(listener); |
| } |
| |
| @Override |
| public void peerSyncReplicationStateChange(String peerId, SyncReplicationState from, |
| SyncReplicationState to, int stage) { |
| if (from == SyncReplicationState.ACTIVE) { |
| if (stage == 0) { |
| Lock lock = createLock.acquireLock(peerId); |
| try { |
| Optional<DualAsyncFSWAL> opt = peerId2WAL.get(peerId); |
| if (opt != null) { |
| opt.ifPresent(w -> w.skipRemoteWAL(to == SyncReplicationState.STANDBY)); |
| } else { |
| // add a place holder to tell the getWAL caller do not use DualAsyncFSWAL any more. |
| peerId2WAL.put(peerId, Optional.empty()); |
| } |
| } finally { |
| lock.unlock(); |
| } |
| } else if (stage == 1) { |
| peerId2WAL.remove(peerId).ifPresent(this::safeClose); |
| } |
| } |
| } |
| |
| private static class DefaultSyncReplicationPeerInfoProvider |
| implements SyncReplicationPeerInfoProvider { |
| |
| @Override |
| public Optional<Pair<String, String>> getPeerIdAndRemoteWALDir(TableName table) { |
| return Optional.empty(); |
| } |
| |
| @Override |
| public boolean checkState(TableName table, |
| BiPredicate<SyncReplicationState, SyncReplicationState> checker) { |
| return false; |
| } |
| } |
| |
| private static final Pattern LOG_PREFIX_PATTERN = Pattern.compile(".*-\\d+-(.+)"); |
| |
| /** |
| * <p> |
| * Returns the peer id if the wal file name is in the special group for a sync replication peer. |
| * </p> |
| * <p> |
| * The prefix format is <factoryId>-<ts>-<peerId>. |
| * </p> |
| */ |
| public static Optional<String> getSyncReplicationPeerIdFromWALName(String name) { |
| if (!name.endsWith(ReplicationUtils.SYNC_WAL_SUFFIX)) { |
| // fast path to return earlier if the name is not for a sync replication peer. |
| return Optional.empty(); |
| } |
| String logPrefix = AbstractFSWALProvider.getWALPrefixFromWALName(name); |
| Matcher matcher = LOG_PREFIX_PATTERN.matcher(logPrefix); |
| if (matcher.matches()) { |
| return Optional.of(matcher.group(1)); |
| } else { |
| return Optional.empty(); |
| } |
| } |
| |
| WALProvider getWrappedProvider() { |
| return provider; |
| } |
| |
| } |