| /** |
| * Licensed to the Apache Software Foundation (ASF) under one |
| * or more contributor license agreements. See the NOTICE file |
| * distributed with this work for additional information |
| * regarding copyright ownership. The ASF licenses this file |
| * to you under the Apache License, Version 2.0 (the |
| * "License"); you may not use this file except in compliance |
| * with the License. You may obtain a copy of the License at |
| * |
| * http://www.apache.org/licenses/LICENSE-2.0 |
| * |
| * Unless required by applicable law or agreed to in writing, software |
| * distributed under the License is distributed on an "AS IS" BASIS, |
| * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| * See the License for the specific language governing permissions and |
| * limitations under the License. |
| */ |
| |
| package org.apache.hadoop.yarn.server.nodemanager; |
| |
| import org.apache.hadoop.conf.Configuration; |
| import org.apache.hadoop.service.AbstractService; |
| import org.apache.hadoop.yarn.conf.YarnConfiguration; |
| import org.apache.hadoop.yarn.api.records.ResourceUtilization; |
| import org.apache.hadoop.yarn.util.ResourceCalculatorPlugin; |
| import org.slf4j.Logger; |
| import org.slf4j.LoggerFactory; |
| |
| /** |
| * Implementation of the node resource monitor. It periodically tracks the |
| * resource utilization of the node and reports it to the NM. |
| */ |
| public class NodeResourceMonitorImpl extends AbstractService implements |
| NodeResourceMonitor { |
| |
| /** Logging infrastructure. */ |
| final static Logger LOG = |
| LoggerFactory.getLogger(NodeResourceMonitorImpl.class); |
| |
| /** Interval to monitor the node resource utilization. */ |
| private long monitoringInterval; |
| /** Thread to monitor the node resource utilization. */ |
| private MonitoringThread monitoringThread; |
| |
| /** Resource calculator. */ |
| private ResourceCalculatorPlugin resourceCalculatorPlugin; |
| |
| /** Current <em>resource utilization</em> of the node. */ |
| private ResourceUtilization nodeUtilization; |
| |
| /** |
| * Initialize the node resource monitor. |
| */ |
| public NodeResourceMonitorImpl() { |
| super(NodeResourceMonitorImpl.class.getName()); |
| |
| this.monitoringThread = new MonitoringThread(); |
| } |
| |
| /** |
| * Initialize the service with the proper parameters. |
| */ |
| @Override |
| protected void serviceInit(Configuration conf) throws Exception { |
| this.monitoringInterval = |
| conf.getLong(YarnConfiguration.NM_RESOURCE_MON_INTERVAL_MS, |
| YarnConfiguration.DEFAULT_NM_RESOURCE_MON_INTERVAL_MS); |
| |
| this.resourceCalculatorPlugin = |
| ResourceCalculatorPlugin.getNodeResourceMonitorPlugin(conf); |
| |
| LOG.info(" Using ResourceCalculatorPlugin : " |
| + this.resourceCalculatorPlugin); |
| } |
| |
| /** |
| * Check if we should be monitoring. |
| * @return <em>true</em> if we can monitor the node resource utilization. |
| */ |
| private boolean isEnabled() { |
| if (this.monitoringInterval <= 0) { |
| LOG.info("Node Resource monitoring interval is <=0. " |
| + this.getClass().getName() + " is disabled."); |
| return false; |
| } |
| if (resourceCalculatorPlugin == null) { |
| LOG.info("ResourceCalculatorPlugin is unavailable on this system. " |
| + this.getClass().getName() + " is disabled."); |
| return false; |
| } |
| return true; |
| } |
| |
| /** |
| * Start the thread that does the node resource utilization monitoring. |
| */ |
| @Override |
| protected void serviceStart() throws Exception { |
| if (this.isEnabled()) { |
| this.monitoringThread.start(); |
| } |
| super.serviceStart(); |
| } |
| |
| /** |
| * Stop the thread that does the node resource utilization monitoring. |
| */ |
| @Override |
| protected void serviceStop() throws Exception { |
| if (this.isEnabled()) { |
| this.monitoringThread.interrupt(); |
| try { |
| this.monitoringThread.join(10 * 1000); |
| } catch (InterruptedException e) { |
| LOG.warn("Could not wait for the thread to join"); |
| } |
| } |
| super.serviceStop(); |
| } |
| |
| /** |
| * Thread that monitors the resource utilization of this node. |
| */ |
| private class MonitoringThread extends Thread { |
| /** |
| * Initialize the node resource monitoring thread. |
| */ |
| public MonitoringThread() { |
| super("Node Resource Monitor"); |
| this.setDaemon(true); |
| } |
| |
| /** |
| * Periodically monitor the resource utilization of the node. |
| */ |
| @Override |
| public void run() { |
| while (true) { |
| // Get node utilization and save it into the health status |
| long pmem = resourceCalculatorPlugin.getPhysicalMemorySize() - |
| resourceCalculatorPlugin.getAvailablePhysicalMemorySize(); |
| long vmem = |
| resourceCalculatorPlugin.getVirtualMemorySize() |
| - resourceCalculatorPlugin.getAvailableVirtualMemorySize(); |
| float vcores = resourceCalculatorPlugin.getNumVCoresUsed(); |
| nodeUtilization = |
| ResourceUtilization.newInstance( |
| (int) (pmem >> 20), // B -> MB |
| (int) (vmem >> 20), // B -> MB |
| vcores); // Used Virtual Cores |
| |
| try { |
| Thread.sleep(monitoringInterval); |
| } catch (InterruptedException e) { |
| LOG.warn(NodeResourceMonitorImpl.class.getName() |
| + " is interrupted. Exiting."); |
| break; |
| } |
| } |
| } |
| } |
| |
| /** |
| * Get the <em>resource utilization</em> of the node. |
| * @return <em>resource utilization</em> of the node. |
| */ |
| @Override |
| public ResourceUtilization getUtilization() { |
| return this.nodeUtilization; |
| } |
| } |