blob: 885165247ffb06ed3627c3ca9a2b6576cd005d6c [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one or more contributor license
* agreements. See the NOTICE file distributed with this work for additional information regarding
* copyright ownership. The ASF licenses this file to You under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance with the License. You may obtain a
* copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software distributed under the License
* is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express
* or implied. See the License for the specific language governing permissions and limitations under
* the License.
*/
package org.apache.geode.internal.cache.control;
import java.util.ArrayList;
import java.util.Collection;
import java.util.Collections;
import java.util.HashMap;
import java.util.HashSet;
import java.util.List;
import java.util.Map;
import java.util.Objects;
import java.util.Set;
import java.util.concurrent.CompletableFuture;
import java.util.concurrent.CopyOnWriteArraySet;
import java.util.concurrent.ExecutorService;
import java.util.concurrent.Future;
import java.util.concurrent.RejectedExecutionException;
import java.util.concurrent.ScheduledExecutorService;
import java.util.concurrent.TimeUnit;
import org.apache.logging.log4j.Logger;
import org.apache.geode.CancelCriterion;
import org.apache.geode.InternalGemFireError;
import org.apache.geode.annotations.internal.MutableForTesting;
import org.apache.geode.cache.Cache;
import org.apache.geode.cache.Region;
import org.apache.geode.cache.control.RebalanceFactory;
import org.apache.geode.cache.control.RebalanceOperation;
import org.apache.geode.cache.control.ResourceManager;
import org.apache.geode.distributed.DistributedMember;
import org.apache.geode.distributed.internal.DistributionAdvisor.Profile;
import org.apache.geode.distributed.internal.DistributionConfig;
import org.apache.geode.distributed.internal.DistributionManager;
import org.apache.geode.internal.ClassPathLoader;
import org.apache.geode.internal.cache.InternalCache;
import org.apache.geode.internal.cache.PartitionedRegion;
import org.apache.geode.internal.cache.control.ResourceAdvisor.ResourceManagerProfile;
import org.apache.geode.internal.cache.partitioned.LoadProbe;
import org.apache.geode.internal.cache.partitioned.SizedBasedLoadProbe;
import org.apache.geode.internal.logging.CoreLoggingExecutors;
import org.apache.geode.internal.monitoring.ThreadsMonitoring;
import org.apache.geode.logging.internal.executors.LoggingExecutors;
import org.apache.geode.logging.internal.log4j.api.LogService;
/**
* Implementation of ResourceManager with additional internal-only methods.
* <p>
* TODO: cleanup raw and typed collections
*/
public class InternalResourceManager implements ResourceManager {
// Logger used by this class (see stopExecutor).
private static final Logger logger = LogService.getLogger();
// Number of threads given to the scheduled executor created in the constructor. Read from the
// system property GEMFIRE_PREFIX + "resource.manager.threads"; defaults to 1.
final int MAX_RESOURCE_MANAGER_EXE_THREADS =
Integer.getInteger(DistributionConfig.GEMFIRE_PREFIX + "resource.manager.threads", 1);
// Startup tasks registered through addStartupTask and drained by allOfStartupTasks.
private final Collection<CompletableFuture<Void>> startupTasks = new ArrayList<>();
/**
 * Kinds of resources that listeners can be registered for. Each constant carries a bit mask in
 * {@code id}; listener registration matches types by AND-ing these masks, so {@code MEMORY}
 * covers both heap and off-heap and {@code ALL} covers every bit.
 */
public enum ResourceType {
  HEAP_MEMORY(0x1),
  OFFHEAP_MEMORY(0x2),
  MEMORY(0x3),
  ALL(0xFFFFFFFF);

  /** Bit mask identifying this resource type. */
  final int id;

  ResourceType(final int mask) {
    id = mask;
  }
}
// Listener sets keyed by resource type. The constructor registers one set each for HEAP_MEMORY
// and OFFHEAP_MEMORY; this map is also the monitor used by deliverLocalEvent.
private Map<ResourceType, Set<ResourceListener>> listeners =
new HashMap<ResourceType, Set<ResourceListener>>();
// Scheduled executor exposed through getExecutor() for resource related tasks.
private final ScheduledExecutorService scheduledExecutor;
// Executor used by runWithNotifyExecutor to dispatch notifications.
private final ExecutorService notifyExecutor;
// The set of in progress rebalance operations.
private final Set<RebalanceOperation> inProgressOperations = new HashSet<RebalanceOperation>();
// Guards every access to inProgressOperations.
private final Object inProgressOperationsLock = new Object();
// The cache this resource manager was created for.
final InternalCache cache;
// Instantiated reflectively from PR_LOAD_PROBE_CLASS in the constructor; replaceable through
// setLoadProbe.
private LoadProbe loadProbe;
private final ResourceManagerStats stats;
// Obtained from the cache's distribution advisor in the constructor.
private final ResourceAdvisor resourceAdvisor;
// Starts out true, is set to false at the end of the constructor and back to true by close().
private boolean closed = true;
// Unmodifiable map holding the heap and off-heap monitors created in the constructor.
private final Map<ResourceType, ResourceMonitor> resourceMonitors;
// Observer used for testing; replaced through setResourceObserver.
@MutableForTesting
private static ResourceObserver observer = new ResourceObserverAdapter();
// Class name of the load probe to instantiate. Read from the system property
// GEMFIRE_PREFIX + "ResourceManager.PR_LOAD_PROBE_CLASS"; defaults to SizedBasedLoadProbe.
private static final String PR_LOAD_PROBE_CLASS =
System.getProperty(DistributionConfig.GEMFIRE_PREFIX + "ResourceManager.PR_LOAD_PROBE_CLASS",
SizedBasedLoadProbe.class.getName());
/**
 * Returns the resource manager of the given cache, cast to the internal implementation type.
 *
 * @param cache the cache whose resource manager is wanted
 * @return the cache's resource manager as an {@code InternalResourceManager}
 */
public static InternalResourceManager getInternalResourceManager(Cache cache) {
  final ResourceManager manager = cache.getResourceManager();
  return (InternalResourceManager) manager;
}
/**
 * Creates a new resource manager for the given cache.
 *
 * @param cache the cache the new resource manager belongs to
 * @return the newly constructed resource manager
 */
public static InternalResourceManager createResourceManager(final InternalCache cache) {
  final InternalResourceManager manager = new InternalResourceManager(cache);
  return manager;
}
/**
 * Builds the resource manager: statistics, the two executors, the load probe, the heap and
 * off-heap monitors and one empty listener set per monitored resource type. The manager is
 * marked as open only once everything has been created.
 *
 * @param cache the cache this resource manager belongs to
 * @throws InternalGemFireError if the configured load probe class cannot be instantiated
 */
private InternalResourceManager(InternalCache cache) {
  this.cache = cache;
  resourceAdvisor = (ResourceAdvisor) cache.getDistributionAdvisor();
  stats = new ResourceManagerStats(cache.getDistributedSystem());

  // Executor that other classes may use for handling resource related tasks.
  scheduledExecutor = LoggingExecutors.newScheduledThreadPool("ResourceManagerRecoveryThread ",
      MAX_RESOURCE_MANAGER_EXE_THREADS);

  // Instantiate the load probe from its configured class name.
  try {
    final Class<?> probeClass = ClassPathLoader.getLatest().forName(PR_LOAD_PROBE_CLASS);
    loadProbe = (LoadProbe) probeClass.newInstance();
  } catch (Exception e) {
    throw new InternalGemFireError("Unable to instantiate " + PR_LOAD_PROBE_CLASS, e);
  }

  // Executor that the resource manager and the monitors it creates can use to dispatch
  // notifications.
  notifyExecutor =
      CoreLoggingExecutors.newSerialThreadPoolWithFeedStatistics("Notification Handler",
          thread -> thread.setPriority(Thread.MAX_PRIORITY), null,
          stats.getResourceEventPoolStatHelper(), getThreadMonitorObj(),
          0, stats.getResourceEventQueueStatHelper());

  // Create the monitors and publish them through an unmodifiable view.
  final Map<ResourceType, ResourceMonitor> monitors = new HashMap<>();
  monitors.put(ResourceType.HEAP_MEMORY, new HeapMemoryMonitor(this, cache, stats));
  monitors.put(ResourceType.OFFHEAP_MEMORY,
      new OffHeapMemoryMonitor(this, cache, cache.getOffHeapStore(), stats));
  resourceMonitors = Collections.unmodifiableMap(monitors);

  // Create the listener sets up front so that it only needs to be done once.
  listeners.put(ResourceType.HEAP_MEMORY, new CopyOnWriteArraySet<ResourceListener>());
  listeners.put(ResourceType.OFFHEAP_MEMORY, new CopyOnWriteArraySet<ResourceListener>());

  closed = false;
}
/**
 * Shuts this resource manager down: stops every monitor, stops both executors, closes the
 * statistics and finally marks the manager as closed.
 */
public void close() {
  resourceMonitors.values().forEach(ResourceMonitor::stopMonitoring);

  stopExecutor(scheduledExecutor);
  stopExecutor(notifyExecutor);

  stats.close();
  closed = true;
}
/**
 * @return {@code true} while the manager is not yet fully constructed or after {@link #close()}
 *         has completed
 */
boolean isClosed() {
  return closed;
}
/**
 * Lets every resource monitor fill in its part of the given profile.
 *
 * @param profile the profile to populate; it is cast to {@code ResourceManagerProfile}
 */
public void fillInProfile(final Profile profile) {
  assert profile instanceof ResourceManagerProfile;
  final ResourceManagerProfile managerProfile = (ResourceManagerProfile) profile;
  resourceMonitors.values().forEach(monitor -> monitor.fillInProfile(managerProfile));
}
/**
 * Registers the listener for every resource type.
 *
 * @param listener the listener to register
 */
public void addResourceListener(final ResourceListener listener) {
  final ResourceType everyType = ResourceType.ALL;
  addResourceListener(everyType, listener);
}
/**
 * Registers the listener with every listener set whose resource type shares at least one mask
 * bit with the requested type.
 *
 * @param resourceType the resource type (or combination such as {@code MEMORY} or {@code ALL})
 *        to listen to
 * @param listener the listener to register
 */
public void addResourceListener(final ResourceType resourceType,
    final ResourceListener listener) {
  listeners.forEach((registeredType, registeredListeners) -> {
    if ((registeredType.id & resourceType.id) != 0) {
      registeredListeners.add(listener);
    }
  });
}
/**
 * Unregisters the listener from every resource type.
 *
 * @param listener the listener to remove
 */
public void removeResourceListener(final ResourceListener listener) {
  final ResourceType everyType = ResourceType.ALL;
  removeResourceListener(everyType, listener);
}
/**
 * Removes the listener from every listener set whose resource type shares at least one mask bit
 * with the requested type.
 *
 * @param resourceType the resource type (or combination such as {@code MEMORY} or {@code ALL})
 *        to stop listening to
 * @param listener the listener to remove
 */
public void removeResourceListener(final ResourceType resourceType,
    final ResourceListener listener) {
  listeners.forEach((registeredType, registeredListeners) -> {
    if ((registeredType.id & resourceType.id) != 0) {
      registeredListeners.remove(listener);
    }
  });
}
/**
* Looks up the listener set stored under exactly the given resource type. No mask matching is
* done here, unlike in addResourceListener. The constructor only creates sets for HEAP_MEMORY and
* OFFHEAP_MEMORY, so as far as this file shows any other type (MEMORY, ALL) yields null.
* <p>
* The returned set is the one held internally, not a copy.
*
* @param resourceType the resource type whose listeners are wanted
* @return the listener set for that type, or null if none is registered under it
*/
public Set<ResourceListener> getResourceListeners(final ResourceType resourceType) {
return this.listeners.get(resourceType);
}
/**
 * Deliver an event received from remote resource managers to the local listeners. The delivery
 * itself is handed to the notification executor via {@link #runWithNotifyExecutor(Runnable)}.
 *
 * @param event Event to deliver; must not be a local event.
 */
public void deliverEventFromRemote(final ResourceEvent event) {
  assert !event.isLocal();

  // Log the incoming event once (the same information used to be logged twice in a row).
  if (this.cache.getLogger().fineEnabled()) {
    this.cache.getLogger()
        .fine("New remote event to deliver for member " + event.getMember() + ": event=" + event);
  }

  runWithNotifyExecutor(() -> deliverLocalEvent(event));
}
/**
 * Hands the event to the monitor responsible for the event's resource type, which notifies the
 * listeners registered for that type, and then counts the delivery in the statistics.
 *
 * @param event the event to deliver
 */
void deliverLocalEvent(ResourceEvent event) {
  // Wait for an event to be handled by all listeners before starting to send another event
  synchronized (this.listeners) {
    final ResourceMonitor monitor = resourceMonitors.get(event.getType());
    final Set<ResourceListener> targets = listeners.get(event.getType());
    monitor.notifyListeners(targets, event);
  }

  stats.incResourceEventsDelivered();
}
/**
 * @return the monitor registered for {@code ResourceType.HEAP_MEMORY}
 */
public HeapMemoryMonitor getHeapMonitor() {
  final ResourceMonitor heapMonitor = resourceMonitors.get(ResourceType.HEAP_MEMORY);
  return (HeapMemoryMonitor) heapMonitor;
}
/**
 * @return the monitor registered for {@code ResourceType.OFFHEAP_MEMORY}
 */
public OffHeapMemoryMonitor getOffHeapMonitor() {
  final ResourceMonitor offHeapMonitor = resourceMonitors.get(ResourceType.OFFHEAP_MEMORY);
  return (OffHeapMemoryMonitor) offHeapMonitor;
}
/**
 * Selects one of the two memory monitors.
 *
 * @param offheap {@code true} for the off-heap monitor, {@code false} for the heap monitor
 * @return the selected monitor
 */
public MemoryMonitor getMemoryMonitor(boolean offheap) {
  return offheap ? getOffHeapMonitor() : getHeapMonitor();
}
/**
 * Submits the runnable to the notification executor. If the executor rejects it, a warning is
 * logged unless this resource manager is already closed.
 *
 * @param runnable Runnable to execute.
 */
void runWithNotifyExecutor(Runnable runnable) {
  try {
    notifyExecutor.execute(runnable);
  } catch (RejectedExecutionException ignore) {
    // A rejection after close() is expected and stays silent.
    if (isClosed()) {
      return;
    }
    cache.getLogger()
        .warning("No memory events will be delivered because of RejectedExecutionException");
  }
}
/**
 * {@inheritDoc}
 * <p>
 * Every call returns a fresh {@code RebalanceFactoryImpl}.
 */
@Override
public RebalanceFactory createRebalanceFactory() {
  final RebalanceFactory factory = new RebalanceFactoryImpl();
  return factory;
}
/**
 * {@inheritDoc}
 * <p>
 * The result is a copy taken under the in-progress lock, so later changes are not reflected.
 */
@Override
public Set<RebalanceOperation> getRebalanceOperations() {
  final Set<RebalanceOperation> snapshot;
  synchronized (inProgressOperationsLock) {
    snapshot = new HashSet<>(inProgressOperations);
  }
  return snapshot;
}
/**
 * Records the operation as in progress.
 *
 * @param op the rebalance operation to track
 */
void addInProgressRebalance(RebalanceOperation op) {
  synchronized (inProgressOperationsLock) {
    inProgressOperations.add(op);
  }
}
/**
 * Stops tracking the operation as in progress.
 *
 * @param op the rebalance operation to forget
 */
void removeInProgressRebalance(RebalanceOperation op) {
  synchronized (inProgressOperationsLock) {
    inProgressOperations.remove(op);
  }
}
/**
 * Factory for rebalance operations on the enclosing resource manager's cache. The included and
 * excluded region sets are stored as given (not copied) and applied through a
 * {@code FilterByPath} when an operation is created.
 */
class RebalanceFactoryImpl implements RebalanceFactory {
  private Set<String> includedRegions;
  private Set<String> excludedRegions;

  @Override
  public RebalanceFactory includeRegions(Set<String> regions) {
    includedRegions = regions;
    return this;
  }

  @Override
  public RebalanceFactory excludeRegions(Set<String> regions) {
    excludedRegions = regions;
    return this;
  }

  @Override
  public RebalanceOperation start() {
    return launch(false);
  }

  @Override
  public RebalanceOperation simulate() {
    return launch(true);
  }

  /**
   * Creates a rebalance operation with the current region filter, starts it and returns it.
   *
   * @param simulation value passed as the operation's simulate flag
   */
  private RebalanceOperation launch(boolean simulation) {
    final RegionFilter regionFilter = new FilterByPath(includedRegions, excludedRegions);
    final RebalanceOperationImpl operation =
        new RebalanceOperationImpl(InternalResourceManager.this.cache, simulation, regionFilter);
    operation.start();
    return operation;
  }
}
/**
 * Shuts the executor down and waits for it to terminate. The wait is bounded by the system
 * property GEMFIRE_PREFIX + "prrecovery-close-timeout" (seconds, default 5). If the executor has
 * not terminated afterwards, it is shut down forcibly and every task that never started and is a
 * {@link Future} is cancelled.
 *
 * @param executor the executor to stop; {@code null} is ignored
 */
void stopExecutor(ExecutorService executor) {
  if (executor == null) {
    return;
  }
  executor.shutdown();
  final int secToWait =
      Integer.getInteger(DistributionConfig.GEMFIRE_PREFIX + "prrecovery-close-timeout", 5);
  try {
    executor.awaitTermination(secToWait, TimeUnit.SECONDS);
  } catch (InterruptedException x) {
    // Preserve the interrupt for the caller; the forced shutdown below still runs.
    Thread.currentThread().interrupt();
    logger.debug("Interrupted while waiting for the resource manager executor to terminate");
  }
  if (!executor.isTerminated()) {
    logger.warn("Failed to stop resource manager threads in {} seconds, forcing shutdown",
        secToWait);
    for (Runnable pending : executor.shutdownNow()) {
      if (pending instanceof Future) {
        ((Future<?>) pending).cancel(true);
      }
    }
  }
}
/**
 * @return the scheduled executor created by this resource manager for resource related tasks
 */
public ScheduledExecutorService getExecutor() {
  return scheduledExecutor;
}
/**
 * @return the statistics object owned by this resource manager
 */
public ResourceManagerStats getStats() {
  return stats;
}
/**
 * For testing only. Installs an observer which is called when rebalancing is started and
 * finished for a particular region. This observer is called even when the "rebalancing" is
 * actually redundancy recovery for a particular region.
 *
 * @param observer the observer to install; {@code null} installs a fresh no-op
 *        {@code ResourceObserverAdapter}
 */
public static void setResourceObserver(ResourceObserver observer) {
  InternalResourceManager.observer =
      (observer != null) ? observer : new ResourceObserverAdapter();
}
/**
 * Get the resource observer used for testing. Never returns null.
 *
 * @return the currently installed observer
 */
public static ResourceObserver getResourceObserver() {
  return InternalResourceManager.observer;
}
/**
* For testing only. Receives callbacks for resource related events.
*/
public interface ResourceObserver {
/**
* Indicates that rebalancing has started on a given region.
*
* @param region the region being rebalanced
*/
void rebalancingStarted(Region region);
/**
* Indicates that rebalancing has finished on a given region.
*
* @param region the region that was rebalanced
*/
void rebalancingFinished(Region region);
/**
* Indicates that recovery has started on a given region.
*
* @param region the region being recovered
*/
void recoveryStarted(Region region);
/**
* Indicates that recovery has finished on a given region.
*
* @param region the region that was recovered
*/
void recoveryFinished(Region region);
/**
* Indicates that a membership event triggered a recovery operation, but the recovery operation
* will not be executed because there is already an existing recovery operation waiting to
* happen on this region.
*
* @param region the region whose recovery was conflated
*/
void recoveryConflated(PartitionedRegion region);
/**
* Indicates that a bucket is being moved from the source member to the target member.
*
* @param region the region
* @param bucketId the bucket being moved
* @param source the member the bucket is moving from
* @param target the member the bucket is moving to
*/
void movingBucket(Region region, int bucketId, DistributedMember source,
DistributedMember target);
/**
* Indicates that a bucket primary is being moved from the source member to the target member.
*
* @param region the region
* @param bucketId the bucket primary being moved
* @param source the member the bucket primary is moving from
* @param target the member the bucket primary is moving to
*/
void movingPrimary(Region region, int bucketId, DistributedMember source,
DistributedMember target);
}
/**
 * No-op {@code ResourceObserver}. The rebalancing and recovery callbacks are funnelled into
 * {@link #rebalancingOrRecoveryStarted(Region)} and {@link #rebalancingOrRecoveryFinished(Region)}
 * so that subclasses can override a single pair of methods.
 */
public static class ResourceObserverAdapter implements ResourceObserver {

  @Override
  public void rebalancingStarted(Region region) {
    rebalancingOrRecoveryStarted(region);
  }

  @Override
  public void rebalancingFinished(Region region) {
    rebalancingOrRecoveryFinished(region);
  }

  @Override
  public void recoveryStarted(Region region) {
    rebalancingOrRecoveryStarted(region);
  }

  @Override
  public void recoveryFinished(Region region) {
    rebalancingOrRecoveryFinished(region);
  }

  /**
   * Indicates that a rebalance or a recovery has started.
   */
  @SuppressWarnings("unused")
  public void rebalancingOrRecoveryStarted(Region region) {
    // intentionally empty
  }

  /**
   * Indicates that a rebalance or a recovery has finished.
   */
  @SuppressWarnings("unused")
  public void rebalancingOrRecoveryFinished(Region region) {
    // intentionally empty
  }

  @Override
  public void recoveryConflated(PartitionedRegion region) {
    // intentionally empty
  }

  @Override
  public void movingBucket(Region region, int bucketId, DistributedMember source,
      DistributedMember target) {
    // intentionally empty
  }

  @Override
  public void movingPrimary(Region region, int bucketId, DistributedMember source,
      DistributedMember target) {
    // intentionally empty
  }
}
/**
 * @return the cancel criterion of the cache this resource manager belongs to
 */
public CancelCriterion getCancelCriterion() {
  return cache.getCancelCriterion();
}
/**
 * @return the resource advisor obtained from the cache when this manager was constructed
 */
public ResourceAdvisor getResourceAdvisor() {
  return resourceAdvisor;
}
/**
 * @return the load probe currently in use
 */
public LoadProbe getLoadProbe() {
  return loadProbe;
}
/**
 * This method is for test purposes only. Replaces the load probe.
 *
 * @param probe the load probe to use from now on
 * @return the load probe that was in use before the call
 */
public LoadProbe setLoadProbe(LoadProbe probe) {
  final LoadProbe previous = loadProbe;
  loadProbe = probe;
  return previous;
}
/**
 * {@inheritDoc}
 * <p>
 * Sets the critical threshold of the off-heap monitor.
 */
@Override
public void setCriticalOffHeapPercentage(float offHeapPercentage) {
  final OffHeapMemoryMonitor offHeapMonitor = getOffHeapMonitor();
  offHeapMonitor.setCriticalThreshold(offHeapPercentage);
}
/**
 * {@inheritDoc}
 * <p>
 * Reads the critical threshold of the off-heap monitor.
 */
@Override
public float getCriticalOffHeapPercentage() {
  final OffHeapMemoryMonitor offHeapMonitor = getOffHeapMonitor();
  return offHeapMonitor.getCriticalThreshold();
}
/**
 * {@inheritDoc}
 * <p>
 * Sets the eviction threshold of the off-heap monitor.
 */
@Override
public void setEvictionOffHeapPercentage(float offHeapPercentage) {
  final OffHeapMemoryMonitor offHeapMonitor = getOffHeapMonitor();
  offHeapMonitor.setEvictionThreshold(offHeapPercentage);
}
/**
 * {@inheritDoc}
 * <p>
 * Reads the eviction threshold of the off-heap monitor.
 */
@Override
public float getEvictionOffHeapPercentage() {
  final OffHeapMemoryMonitor offHeapMonitor = getOffHeapMonitor();
  return offHeapMonitor.getEvictionThreshold();
}
/**
 * {@inheritDoc}
 * <p>
 * Sets the critical threshold of the heap monitor.
 */
@Override
public void setCriticalHeapPercentage(float heapPercentage) {
  final HeapMemoryMonitor heapMonitor = getHeapMonitor();
  heapMonitor.setCriticalThreshold(heapPercentage);
}
/**
 * {@inheritDoc}
 * <p>
 * Reads the critical threshold of the heap monitor.
 */
@Override
public float getCriticalHeapPercentage() {
  final HeapMemoryMonitor heapMonitor = getHeapMonitor();
  return heapMonitor.getCriticalThreshold();
}
/**
 * {@inheritDoc}
 * <p>
 * Sets the eviction threshold of the heap monitor.
 */
@Override
public void setEvictionHeapPercentage(float heapPercentage) {
  final HeapMemoryMonitor heapMonitor = getHeapMonitor();
  heapMonitor.setEvictionThreshold(heapPercentage);
}
/**
 * {@inheritDoc}
 * <p>
 * Reads the eviction threshold of the heap monitor.
 */
@Override
public float getEvictionHeapPercentage() {
  final HeapMemoryMonitor heapMonitor = getHeapMonitor();
  return heapMonitor.getEvictionThreshold();
}
/**
 * @return the thread monitoring of the cache's distribution manager, or {@code null} when the
 *         cache has no distribution manager
 */
private ThreadsMonitoring getThreadMonitorObj() {
  final DistributionManager dm = cache.getDistributionManager();
  return (dm == null) ? null : dm.getThreadMonitoring();
}
/**
 * Registers a task that represents an asynchronous action during startup.
 *
 * @param startupTask the CompletableFuture startup task
 * @throws NullPointerException if {@code startupTask} is {@code null}
 */
public void addStartupTask(CompletableFuture<Void> startupTask) {
  startupTasks.add(Objects.requireNonNull(startupTask));
}
/**
 * Takes a snapshot of the registered startup tasks, clears the registry and returns a
 * CompletableFuture that completes when all of the tasks in the snapshot complete.
 *
 * @return a CompletableFuture that completes when all of the startup tasks complete
 */
public CompletableFuture<Void> allOfStartupTasks() {
  final CompletableFuture<?>[] pending = startupTasks.toArray(new CompletableFuture<?>[0]);
  startupTasks.clear();
  return CompletableFuture.allOf(pending);
}
}