| // Licensed to the Apache Software Foundation (ASF) under one |
| // or more contributor license agreements. See the NOTICE file |
| // distributed with this work for additional information |
| // regarding copyright ownership. The ASF licenses this file |
| // to you under the Apache License, Version 2.0 (the |
| // "License"); you may not use this file except in compliance |
| // with the License. You may obtain a copy of the License at |
| // |
| // http://www.apache.org/licenses/LICENSE-2.0 |
| // |
| // Unless required by applicable law or agreed to in writing, |
| // software distributed under the License is distributed on an |
| // "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY |
| // KIND, either express or implied. See the License for the |
| // specific language governing permissions and limitations |
| // under the License. |
| package com.cloud.hypervisor.kvm.resource; |
| |
| import com.cloud.utils.script.Script; |
| import org.apache.cloudstack.managed.context.ManagedContextRunnable; |
| import org.apache.log4j.Logger; |
| import org.libvirt.Connect; |
| import org.libvirt.LibvirtException; |
| import org.libvirt.StoragePool; |
| import org.libvirt.StoragePoolInfo.StoragePoolState; |
| |
| import java.util.ArrayList; |
| import java.util.HashSet; |
| import java.util.List; |
| import java.util.Map; |
| import java.util.Set; |
| import java.util.concurrent.ConcurrentHashMap; |
| |
| public class KVMHAMonitor extends KVMHABase implements Runnable { |
| private static final Logger s_logger = Logger.getLogger(KVMHAMonitor.class); |
| private final Map<String, NfsStoragePool> _storagePool = new ConcurrentHashMap<String, NfsStoragePool>(); |
| |
| private final String _hostIP; /* private ip address */ |
| |
| public KVMHAMonitor(NfsStoragePool pool, String host, String scriptPath) { |
| if (pool != null) { |
| _storagePool.put(pool._poolUUID, pool); |
| } |
| _hostIP = host; |
| configureHeartBeatPath(scriptPath); |
| } |
| |
| private static synchronized void configureHeartBeatPath(String scriptPath) { |
| KVMHABase.s_heartBeatPath = scriptPath; |
| } |
| |
| public void addStoragePool(NfsStoragePool pool) { |
| synchronized (_storagePool) { |
| _storagePool.put(pool._poolUUID, pool); |
| } |
| } |
| |
| public void removeStoragePool(String uuid) { |
| synchronized (_storagePool) { |
| NfsStoragePool pool = _storagePool.get(uuid); |
| if (pool != null) { |
| Script.runSimpleBashScript("umount " + pool._mountDestPath); |
| _storagePool.remove(uuid); |
| } |
| } |
| } |
| |
| public List<NfsStoragePool> getStoragePools() { |
| synchronized (_storagePool) { |
| return new ArrayList<NfsStoragePool>(_storagePool.values()); |
| } |
| } |
| |
| public NfsStoragePool getStoragePool(String uuid) { |
| synchronized (_storagePool) { |
| return _storagePool.get(uuid); |
| } |
| } |
| |
| private class Monitor extends ManagedContextRunnable { |
| |
| @Override |
| protected void runInContext() { |
| synchronized (_storagePool) { |
| Set<String> removedPools = new HashSet<String>(); |
| for (String uuid : _storagePool.keySet()) { |
| NfsStoragePool primaryStoragePool = _storagePool.get(uuid); |
| |
| // check for any that have been deregistered with libvirt and |
| // skip,remove them |
| |
| StoragePool storage = null; |
| try { |
| Connect conn = LibvirtConnection.getConnection(); |
| storage = conn.storagePoolLookupByUUIDString(uuid); |
| if (storage == null) { |
| s_logger.debug("Libvirt storage pool " + uuid + " not found, removing from HA list"); |
| removedPools.add(uuid); |
| continue; |
| |
| } else if (storage.getInfo().state != StoragePoolState.VIR_STORAGE_POOL_RUNNING) { |
| s_logger.debug("Libvirt storage pool " + uuid + " found, but not running, removing from HA list"); |
| |
| removedPools.add(uuid); |
| continue; |
| } |
| s_logger.debug("Found NFS storage pool " + uuid + " in libvirt, continuing"); |
| |
| } catch (LibvirtException e) { |
| s_logger.debug("Failed to lookup libvirt storage pool " + uuid + " due to: " + e); |
| |
| // we only want to remove pool if it's not found, not if libvirt |
| // connection fails |
| if (e.toString().contains("pool not found")) { |
| s_logger.debug("removing pool from HA monitor since it was deleted"); |
| removedPools.add(uuid); |
| continue; |
| } |
| } |
| |
| String result = null; |
| // Try multiple times, but sleep in between tries to ensure it isn't a short lived transient error |
| for (int i = 1; i <= _heartBeatUpdateMaxTries; i++) { |
| Script cmd = new Script(s_heartBeatPath, _heartBeatUpdateTimeout, s_logger); |
| cmd.add("-i", primaryStoragePool._poolIp); |
| cmd.add("-p", primaryStoragePool._poolMountSourcePath); |
| cmd.add("-m", primaryStoragePool._mountDestPath); |
| cmd.add("-h", _hostIP); |
| result = cmd.execute(); |
| if (result != null) { |
| s_logger.warn("write heartbeat failed: " + result + ", try: " + i + " of " + _heartBeatUpdateMaxTries); |
| try { |
| Thread.sleep(_heartBeatUpdateRetrySleep); |
| } catch (InterruptedException e) { |
| s_logger.debug("[ignored] interupted between heartbeat retries."); |
| } |
| } else { |
| break; |
| } |
| } |
| |
| if (result != null) { |
| // Stop cloudstack-agent if can't write to heartbeat file. |
| // This will raise an alert on the mgmt server |
| s_logger.warn("write heartbeat failed: " + result + "; stopping cloudstack-agent"); |
| Script cmd = new Script(s_heartBeatPath, _heartBeatUpdateTimeout, s_logger); |
| cmd.add("-i", primaryStoragePool._poolIp); |
| cmd.add("-p", primaryStoragePool._poolMountSourcePath); |
| cmd.add("-m", primaryStoragePool._mountDestPath); |
| cmd.add("-c"); |
| result = cmd.execute(); |
| } |
| } |
| |
| if (!removedPools.isEmpty()) { |
| for (String uuid : removedPools) { |
| removeStoragePool(uuid); |
| } |
| } |
| } |
| |
| } |
| } |
| |
| @Override |
| public void run() { |
| // s_logger.addAppender(new org.apache.log4j.ConsoleAppender(new |
| // org.apache.log4j.PatternLayout(), "System.out")); |
| while (true) { |
| Thread monitorThread = new Thread(new Monitor()); |
| monitorThread.start(); |
| try { |
| monitorThread.join(); |
| } catch (InterruptedException e) { |
| s_logger.debug("[ignored] interupted joining monitor."); |
| } |
| |
| try { |
| Thread.sleep(_heartBeatUpdateFreq); |
| } catch (InterruptedException e) { |
| s_logger.debug("[ignored] interupted between heartbeats."); |
| } |
| } |
| } |
| |
| } |