// Source: modules/core/src/main/java/org/apache/ignite/IgniteCluster.java - ignite - Git at Google

 /*
  * Licensed to the Apache Software Foundation (ASF) under one or more
  * contributor license agreements.  See the NOTICE file distributed with
  * this work for additional information regarding copyright ownership.
  * The ASF licenses this file to You under the Apache License, Version 2.0
  * (the "License"); you may not use this file except in compliance with
  * the License.  You may obtain a copy of the License at
  *
  *      http://www.apache.org/licenses/LICENSE-2.0
  *
  * Unless required by applicable law or agreed to in writing, software
  * distributed under the License is distributed on an "AS IS" BASIS,
  * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  * See the License for the specific language governing permissions and
  * limitations under the License.
  */

 package org.apache.ignite;

 import java.io.File;
 import java.util.Collection;
 import java.util.Map;
 import java.util.UUID;
 import java.util.concurrent.ConcurrentMap;
 import org.apache.ignite.cluster.BaselineNode;
 import org.apache.ignite.cluster.ClusterGroup;
 import org.apache.ignite.cluster.ClusterNode;
 import org.apache.ignite.cluster.ClusterStartNodeResult;
 import org.apache.ignite.cluster.ClusterState;
 import org.apache.ignite.configuration.IgniteConfiguration;
 import org.apache.ignite.internal.processors.cluster.baseline.autoadjust.BaselineAutoAdjustStatus;
 import org.apache.ignite.lang.IgniteAsyncSupport;
 import org.apache.ignite.lang.IgniteAsyncSupported;
 import org.apache.ignite.lang.IgniteFuture;
 import org.jetbrains.annotations.Nullable;

 /**
  * Represents the whole cluster (all available nodes) and also provides a handle on {@link #nodeLocalMap()}, which
  * provides map-like functionality linked to the current grid node. Node-local map is useful for saving shared state
  * between job executions on the grid. Additionally, you can ping, start, stop, and restart remote nodes, map keys to
  * caching nodes, and get other useful information about topology.
  * <p>
  * The interface also exposes cluster-wide administrative operations: cluster state, baseline topology (including
  * baseline auto-adjust), per-cache WAL control, cache statistics, cluster ID and tag, and shutdown policy.
  */
 public interface IgniteCluster extends ClusterGroup, IgniteAsyncSupport {
     /**
      * Maximum allowed length of the cluster tag (see {@link #tag()} and {@link #tag(String)}).
      */
     public static final int MAX_TAG_LENGTH = 280;

     /**
      * Gets local grid node.
      *
      * @return Local grid node.
      */
     public ClusterNode localNode();

     /**
      * Gets a cluster group consisting of the local node.
      *
      * @return Cluster group consisting of the local node.
      */
     public ClusterGroup forLocal();

     /**
      * Gets node-local storage instance.
      * <p>
      * Node-local values are similar to thread locals in that these values are not
      * distributed and are kept only on the local node (similarly to how thread-local values are attached to the
      * current thread only). Node-local values are used primarily by closures executed from the remote
      * nodes to keep intermediate state on the local node between executions.
      * <p>
      * There's only one instance of node local storage per local node. Node local storage is
      * based on {@link java.util.concurrent.ConcurrentMap} and is safe for multi-threaded access.
      *
      * @param <K> Type of keys in the node local map.
      * @param <V> Type of mapped values in the node local map.
      * @return Node local storage instance for the local node.
      */
     public <K, V> ConcurrentMap<K, V> nodeLocalMap();

     /**
      * Pings a remote node.
      * <p>
      * Discovery SPIs usually have some latency in discovering failed nodes. Hence,
      * communication to remote nodes may fail at times if an attempt was made to
      * establish communication with a failed node. This method can be used to check
      * if communication has failed due to node failure or due to some other reason.
      *
      * @param nodeId ID of a node to ping.
      * @return {@code true} if node for a given ID is alive, {@code false} otherwise.
      * @see org.apache.ignite.spi.discovery.DiscoverySpi
      */
     public boolean pingNode(UUID nodeId);

     /**
      * Gets current topology version. In case of TCP discovery
      * (see {@link org.apache.ignite.spi.discovery.tcp.TcpDiscoverySpi}) topology versions
      * are sequential - they start from {@code '1'} and get incremented every time a
      * node joins or leaves. For other discovery SPIs topology versions may not be (and likely are
      * not) sequential.
      *
      * @return Current topology version.
      */
     public long topologyVersion();

     /**
      * Gets a topology by version. Returns {@code null} if topology history storage doesn't contain
      * specified topology version (history currently keeps last {@code 1000} snapshots).
      *
      * @param topVer Topology version.
      * @return Collection of grid nodes which are represented by the specified topology version,
      * if it is present in history storage, {@code null} otherwise.
      * @throws UnsupportedOperationException If underlying SPI implementation does not support
      *      topology history. Currently only {@link org.apache.ignite.spi.discovery.tcp.TcpDiscoverySpi}
      *      supports topology history.
      */
     public Collection<ClusterNode> topology(long topVer) throws UnsupportedOperationException;

     /**
      * Starts one or more nodes on remote host(s).
      * <p>
      * This method takes INI file which defines all startup parameters. It can contain one or
      * more sections, each for a host or for range of hosts (note that they must have different
      * names) and a special '{@code defaults}' section with default values. They are applied to
      * undefined parameters in host's sections.
      * <p>
      * Returned result is collection of tuples. Each tuple corresponds to one node start attempt and
      * contains hostname, success flag and error message if attempt was not successful. Note that
      * successful attempt doesn't mean that node was actually started and joined topology. For large
      * topologies (&gt; 100s nodes) it can take over 10 minutes for all nodes to start. See individual
      * node logs for details.
      * <p>
      * Supports asynchronous execution (see {@link IgniteAsyncSupport}).
      *
      * @param file Configuration file.
      * @param restart Whether to stop existing nodes. If {@code true}, all existing
      *      nodes on the host will be stopped before starting new ones. If
      *      {@code false}, nodes will be started only if there are fewer
      *      nodes on the host than expected.
      * @param timeout Connection timeout.
      * @param maxConn Number of parallel SSH connections to one host.
      * @return Collection of start node results, each containing host name, result (success or failure)
      *      and error message (if any).
      * @throws IgniteException In case of error.
      */
     @IgniteAsyncSupported
     public Collection<ClusterStartNodeResult> startNodes(File file, boolean restart, int timeout,
         int maxConn) throws IgniteException;

     /**
      * Starts one or more nodes on remote host(s) asynchronously.
      * <p>
      * This method takes INI file which defines all startup parameters. It can contain one or
      * more sections, each for a host or for range of hosts (note that they must have different
      * names) and a special '{@code defaults}' section with default values. They are applied to
      * undefined parameters in host's sections.
      * <p>
      * Completed future contains collection of tuples. Each tuple corresponds to one node start attempt and
      * contains hostname, success flag and error message if attempt was not successful. Note that
      * successful attempt doesn't mean that node was actually started and joined topology. For large
      * topologies (&gt; 100s nodes) it can take over 10 minutes for all nodes to start. See individual
      * node logs for details.
      *
      * @param file Configuration file.
      * @param restart Whether to stop existing nodes. If {@code true}, all existing
      *      nodes on the host will be stopped before starting new ones. If
      *      {@code false}, nodes will be started only if there are fewer
      *      nodes on the host than expected.
      * @param timeout Connection timeout.
      * @param maxConn Number of parallel SSH connections to one host.
      * @return Future representing pending completion of the starting nodes.
      * @throws IgniteException In case of error.
      */
     public IgniteFuture<Collection<ClusterStartNodeResult>> startNodesAsync(File file, boolean restart, int timeout,
         int maxConn) throws IgniteException;

     /**
      * Starts one or more nodes on remote host(s).
      * <p>
      * Each map in {@code hosts} collection
      * defines startup parameters for one host or for a range of hosts. The following
      * parameters are supported:
      *     <table class="doctable">
      *         <tr>
      *             <th>Name</th>
      *             <th>Type</th>
      *             <th>Description</th>
      *         </tr>
      *         <tr>
      *             <td><b>host</b></td>
      *             <td>String</td>
      *             <td>
      *                 Hostname (required). Can define several hosts if their IPs are sequential.
      *                 E.g., {@code 10.0.0.1~5} defines range of five IP addresses. Other
      *                 parameters are applied to all hosts equally.
      *             </td>
      *         </tr>
      *         <tr>
      *             <td><b>port</b></td>
      *             <td>Integer</td>
      *             <td>Port number (default is {@code 22}).</td>
      *         </tr>
      *         <tr>
      *             <td><b>uname</b></td>
      *             <td>String</td>
      *             <td>Username (if not defined, current local username will be used).</td>
      *         </tr>
      *         <tr>
      *             <td><b>passwd</b></td>
      *             <td>String</td>
      *             <td>Password (if not defined, private key file must be defined).</td>
      *         </tr>
      *         <tr>
      *             <td><b>key</b></td>
      *             <td>File</td>
      *             <td>Private key file (if not defined, password must be defined).</td>
      *         </tr>
      *         <tr>
      *             <td><b>nodes</b></td>
      *             <td>Integer</td>
      *             <td>
      *                 Expected number of nodes on the host. If some nodes are started
      *                 already, then only remaining nodes will be started. If current count of
      *                 nodes is equal to this number, and {@code restart} flag is {@code false},
      *                 then nothing will happen.
      *             </td>
      *         </tr>
      *         <tr>
      *             <td><b>igniteHome</b></td>
      *             <td>String</td>
      *             <td>
      *                 Path to Ignite installation folder. If not defined, IGNITE_HOME
      *                 environment variable must be set on remote hosts.
      *             </td>
      *         </tr>
      *         <tr>
      *             <td><b>cfg</b></td>
      *             <td>String</td>
      *             <td>Path to configuration file (relative to {@code igniteHome}).</td>
      *         </tr>
      *         <tr>
      *             <td><b>script</b></td>
      *             <td>String</td>
      *             <td>
      *                 Custom startup script file name and path (relative to {@code igniteHome}).
      *                 You can also specify a space-separated list of parameters in the same
      *                 string (for example: {@code "bin/my-custom-script.sh -v"}).
      *             </td>
      *         </tr>
      *     </table>
      * <p>
      * {@code dflts} map defines default values. They are applied to undefined parameters in
      * {@code hosts} collection.
      * <p>
      * Returned result is collection of tuples. Each tuple corresponds to one node start attempt and
      * contains hostname, success flag and error message if attempt was not successful. Note that
      * successful attempt doesn't mean that node was actually started and joined topology. For large
      * topologies (&gt; 100s nodes) it can take over 10 minutes for all nodes to start. See individual
      * node logs for details.
      * <p>
      * Supports asynchronous execution (see {@link IgniteAsyncSupport}).
      *
      * @param hosts Startup parameters.
      * @param dflts Default values.
      * @param restart Whether to stop existing nodes. If {@code true}, all existing
      *      nodes on the host will be stopped before starting new ones. If
      *      {@code false}, nodes will be started only if there are fewer
      *      nodes on the host than expected.
      * @param timeout Connection timeout in milliseconds.
      * @param maxConn Number of parallel SSH connections to one host.
      * @return Collection of start node results, each containing host name, result (success or failure)
      *      and error message (if any).
      * @throws IgniteException In case of error.
      */
     @IgniteAsyncSupported
     public Collection<ClusterStartNodeResult> startNodes(Collection<Map<String, Object>> hosts,
         @Nullable Map<String, Object> dflts, boolean restart, int timeout, int maxConn) throws IgniteException;

     /**
      * Starts one or more nodes on remote host(s) asynchronously.
      * <p>
      * Each map in {@code hosts} collection
      * defines startup parameters for one host or for a range of hosts. The following
      * parameters are supported:
      *     <table class="doctable">
      *         <tr>
      *             <th>Name</th>
      *             <th>Type</th>
      *             <th>Description</th>
      *         </tr>
      *         <tr>
      *             <td><b>host</b></td>
      *             <td>String</td>
      *             <td>
      *                 Hostname (required). Can define several hosts if their IPs are sequential.
      *                 E.g., {@code 10.0.0.1~5} defines range of five IP addresses. Other
      *                 parameters are applied to all hosts equally.
      *             </td>
      *         </tr>
      *         <tr>
      *             <td><b>port</b></td>
      *             <td>Integer</td>
      *             <td>Port number (default is {@code 22}).</td>
      *         </tr>
      *         <tr>
      *             <td><b>uname</b></td>
      *             <td>String</td>
      *             <td>Username (if not defined, current local username will be used).</td>
      *         </tr>
      *         <tr>
      *             <td><b>passwd</b></td>
      *             <td>String</td>
      *             <td>Password (if not defined, private key file must be defined).</td>
      *         </tr>
      *         <tr>
      *             <td><b>key</b></td>
      *             <td>File</td>
      *             <td>Private key file (if not defined, password must be defined).</td>
      *         </tr>
      *         <tr>
      *             <td><b>nodes</b></td>
      *             <td>Integer</td>
      *             <td>
      *                 Expected number of nodes on the host. If some nodes are started
      *                 already, then only remaining nodes will be started. If current count of
      *                 nodes is equal to this number, and {@code restart} flag is {@code false},
      *                 then nothing will happen.
      *             </td>
      *         </tr>
      *         <tr>
      *             <td><b>igniteHome</b></td>
      *             <td>String</td>
      *             <td>
      *                 Path to Ignite installation folder. If not defined, IGNITE_HOME
      *                 environment variable must be set on remote hosts.
      *             </td>
      *         </tr>
      *         <tr>
      *             <td><b>cfg</b></td>
      *             <td>String</td>
      *             <td>Path to configuration file (relative to {@code igniteHome}).</td>
      *         </tr>
      *         <tr>
      *             <td><b>script</b></td>
      *             <td>String</td>
      *             <td>
      *                 Custom startup script file name and path (relative to {@code igniteHome}).
      *                 You can also specify a space-separated list of parameters in the same
      *                 string (for example: {@code "bin/my-custom-script.sh -v"}).
      *             </td>
      *         </tr>
      *     </table>
      * <p>
      * {@code dflts} map defines default values. They are applied to undefined parameters in
      * {@code hosts} collection.
      * <p>
      * Completed future contains collection of tuples. Each tuple corresponds to one node start attempt and
      * contains hostname, success flag and error message if attempt was not successful. Note that
      * successful attempt doesn't mean that node was actually started and joined topology. For large
      * topologies (&gt; 100s nodes) it can take over 10 minutes for all nodes to start. See individual
      * node logs for details.
      *
      * @param hosts Startup parameters.
      * @param dflts Default values.
      * @param restart Whether to stop existing nodes. If {@code true}, all existing
      *      nodes on the host will be stopped before starting new ones. If
      *      {@code false}, nodes will be started only if there are fewer
      *      nodes on the host than expected.
      * @param timeout Connection timeout in milliseconds.
      * @param maxConn Number of parallel SSH connections to one host.
      * @return Future representing pending completion of the starting nodes.
      * @throws IgniteException In case of error.
      */
     public IgniteFuture<Collection<ClusterStartNodeResult>> startNodesAsync(Collection<Map<String, Object>> hosts,
         @Nullable Map<String, Object> dflts, boolean restart, int timeout, int maxConn) throws IgniteException;

     /**
      * Stops nodes satisfying optional set of predicates.
      * <p>
      * <b>NOTE:</b> {@code System.exit(Ignition.KILL_EXIT_CODE)} will be executed on each
      * stopping node. If you have other applications running in the same JVM along with Ignition,
      * those applications will be stopped as well.
      *
      * @throws IgniteException In case of error.
      */
     public void stopNodes() throws IgniteException;

     /**
      * Stops nodes defined by provided IDs.
      * <p>
      * <b>NOTE:</b> {@code System.exit(Ignition.KILL_EXIT_CODE)} will be executed on each
      * stopping node. If you have other applications running in the same JVM along with Ignition,
      * those applications will be stopped as well.
      *
      * @param ids IDs defining nodes to stop.
      * @throws IgniteException In case of error.
      */
     public void stopNodes(Collection<UUID> ids) throws IgniteException;

     /**
      * Restarts nodes satisfying optional set of predicates.
      * <p>
      * <b>NOTE:</b> this command only works for grid nodes started with Ignition
      * {@code ignite.sh} or {@code ignite.bat} scripts.
      *
      * @throws IgniteException In case of error.
      */
     public void restartNodes() throws IgniteException;

     /**
      * Restarts nodes defined by provided IDs.
      * <p>
      * <b>NOTE:</b> this command only works for grid nodes started with Ignition
      * {@code ignite.sh} or {@code ignite.bat} scripts.
      *
      * @param ids IDs defining nodes to restart.
      * @throws IgniteException In case of error.
      */
     public void restartNodes(Collection<UUID> ids) throws IgniteException;

     /**
      * Resets local I/O, job, and task execution metrics.
      */
     public void resetMetrics();

     /**
      * Enables or disables statistics for the given caches cluster-wide.
      *
      * @param caches Collection of cache names.
      * @param enabled Statistics enabled flag.
      */
     public void enableStatistics(Collection<String> caches, boolean enabled);

     /**
      * Clears statistics for the given caches cluster-wide.
      *
      * @param caches Collection of cache names.
      */
     public void clearStatistics(Collection<String> caches);

     /**
      * Sets transaction timeout on partition map exchange.
      *
      * @param timeout Transaction timeout on partition map exchange in milliseconds.
      */
     public void setTxTimeoutOnPartitionMapExchange(long timeout);

     /**
      * If the local client node is disconnected from the cluster, returns a future
      * that will be completed when the client has reconnected.
      *
      * @return Future that will be completed when client reconnected; may be {@code null}.
      */
     @Nullable public IgniteFuture<?> clientReconnectFuture();

     /**
      * Checks whether the Ignite grid is active.
      *
      * @return {@code True} if grid is active. {@code False} if grid is not active.
      * @deprecated Use {@link #state()} instead.
      */
     @Deprecated
     public boolean active();

     /**
      * Changes Ignite grid state to active or inactive.
      * <p>
      * <b>NOTE:</b>
      * Deactivation clears in-memory caches (without persistence) including the system caches.
      *
      * @param active If {@code True} start activation process. If {@code False} start deactivation process.
      * @throws IgniteException If there is an already started transaction or lock in the same thread.
      * @deprecated Use {@link #state(ClusterState)} instead.
      */
     @Deprecated
     public void active(boolean active);

     /**
      * Gets current cluster state.
      *
      * @return Current cluster state.
      */
     public ClusterState state();

     /**
      * Changes current cluster state to the given {@code newState} cluster state.
      * <p>
      * <b>NOTE:</b>
      * Deactivation clears in-memory caches (without persistence) including the system caches.
      *
      * @param newState New cluster state.
      * @throws IgniteException If there is an already started transaction or lock in the same thread.
      */
     public void state(ClusterState newState) throws IgniteException;

     /**
      * Gets current baseline topology. If baseline topology was not set, will return {@code null}.
      *
      * @return Collection of nodes included in the current baseline topology, or {@code null} if it was not set.
      */
     @Nullable public Collection<BaselineNode> currentBaselineTopology();

     /**
      * Sets baseline topology. The cluster must be activated for this method to be called.
      *
      * @param baselineTop A collection of nodes to be included in the baseline topology.
      */
     public void setBaselineTopology(Collection<? extends BaselineNode> baselineTop);

     /**
      * Sets baseline topology constructed from the cluster topology of the given version (the method succeeds
      * only if the cluster topology has not changed). All client and daemon nodes will be filtered out of the
      * resulting baseline.
      *
      * @param topVer Topology version to set.
      */
     public void setBaselineTopology(long topVer);

     /** {@inheritDoc} */
     @Deprecated
     @Override public IgniteCluster withAsync();

     /**
      * Disables write-ahead logging for specified cache. When WAL is disabled, changes are not logged to disk.
      * This significantly improves cache update speed. The drawback is absence of local crash-recovery guarantees.
      * If node is crashed, local content of WAL-disabled cache will be cleared on restart to avoid data corruption.
      * <p>
      * Internally this method will wait for all current cache operations to finish and prevent new cache operations
      * from being executed. Then checkpoint is initiated to flush all data to disk. Control is returned to the caller
      * when all dirty pages are prepared for checkpoint, but not necessarily flushed to disk.
      * <p>
      * WAL state can be changed only for persistent caches.
      * <p>
      * <b>NOTE:</b>
      * Currently, this method should only be called on a stable topology when no nodes are leaving or joining cluster,
      * and all baseline nodes are present.
      * Cache may be stuck in inconsistent state due to violation of these conditions. It is advised to destroy
      * such cache.
      *
      * @param cacheName Cache name.
      * @return Whether WAL disabled by this call.
      * @throws IgniteException If error occurs.
      * @see #enableWal(String)
      * @see #isWalEnabled(String)
      */
     public boolean disableWal(String cacheName) throws IgniteException;

     /**
      * Enables write-ahead logging for specified cache, restoring the crash-recovery guarantees given up by a
      * previous call to {@link #disableWal(String)}.
      * <p>
      * Internally this method will wait for all current cache operations to finish and prevent new cache operations
      * from being executed. Then checkpoint is initiated to flush all data to disk. Control is returned to the caller
      * when all data is persisted to disk.
      * <p>
      * WAL state can be changed only for persistent caches.
      * <p>
      * <b>NOTE:</b>
      * Currently, this method should only be called on a stable topology when no nodes are leaving or joining cluster,
      * and all baseline nodes are present.
      * Cache may be stuck in inconsistent state due to violation of these conditions. It is advised to destroy
      * such cache.
      *
      * @param cacheName Cache name.
      * @return Whether WAL enabled by this call.
      * @throws IgniteException If error occurs.
      * @see #disableWal(String)
      * @see #isWalEnabled(String)
      */
     public boolean enableWal(String cacheName) throws IgniteException;

     /**
      * Checks if write-ahead logging is enabled for specified cache.
      *
      * @param cacheName Cache name.
      * @return {@code True} if WAL is enabled for cache.
      * @see #disableWal(String)
      * @see #enableWal(String)
      */
     public boolean isWalEnabled(String cacheName);

     /**
      * Cluster ID is a unique identifier automatically generated when cluster starts up for the very first time.
      * <p>
      * It is a cluster-wide property so all nodes of the cluster (including client nodes) return the same value.
      * <p>
      * In in-memory clusters ID is generated again upon each cluster restart.
      * In clusters running in persistent mode cluster ID is stored to disk and is used even after full cluster restart.
      *
      * @return Unique cluster ID.
      */
     public UUID id();

     /**
      * User-defined tag describing the cluster.
      *
      * @return Current tag value, the same across all nodes of the cluster.
      */
     public String tag();

     /**
      * Enables user to add a specific label to the cluster, e.g. to describe the purpose of the cluster
      * or any of its characteristics.
      * Tag is set cluster-wide,
      * value set on one node will be distributed across all nodes (including client nodes) in the cluster.
      * <p>
      * Maximum tag length is limited by {@link #MAX_TAG_LENGTH} value.
      *
      * @param tag New tag to be set.
      *
      * @throws IgniteCheckedException In case tag change is requested on inactive cluster
      *  or concurrent tag change request was completed before the current one.
      *  Also provided tag is checked for max length.
      */
     public void tag(String tag) throws IgniteCheckedException;

     /**
      * Checks whether the baseline is auto-adjusted or controlled manually.
      *
      * @return Value of manual baseline control or auto adjusting baseline. {@code True} if cluster is in auto-adjust
      * mode. {@code False} if cluster is in manual mode.
      */
     public boolean isBaselineAutoAdjustEnabled();

     /**
      * Switches between manual baseline control and baseline auto-adjust.
      *
      * @param baselineAutoAdjustEnabled Value of manual baseline control or auto adjusting baseline. {@code True} if
      * cluster is in auto-adjust mode. {@code False} if cluster is in manual mode.
      * @throws IgniteException If operation failed.
      */
     public void baselineAutoAdjustEnabled(boolean baselineAutoAdjustEnabled) throws IgniteException;

     /**
      * Gets the baseline auto-adjust timeout.
      *
      * @return Value of time which we would wait before the actual topology change since last server topology change
      * (node join/left/fail).
      * @throws IgniteException If operation failed.
      */
     public long baselineAutoAdjustTimeout();

     /**
      * Sets the baseline auto-adjust timeout.
      *
      * @param baselineAutoAdjustTimeout Value of time which we would wait before the actual topology change since last
      * server topology change (node join/left/fail).
      * @throws IgniteException If failed.
      */
     public void baselineAutoAdjustTimeout(long baselineAutoAdjustTimeout) throws IgniteException;

     /**
      * Gets the status of baseline auto-adjust.
      *
      * @return Status of baseline auto-adjust.
      */
     public BaselineAutoAdjustStatus baselineAutoAdjustStatus();

     /**
      * Returns the shutdown policy, or the default value {@code IgniteConfiguration.DFLT_SHUTDOWN_POLICY}
      * if the property is not set.
      *
      * @return Shutdown policy.
      */
     public ShutdownPolicy shutdownPolicy();

     /**
      * Sets a shutdown policy on a cluster.
      * If a policy is specified here, the value will override the static configuration set via
      * {@link IgniteConfiguration#setShutdownPolicy(ShutdownPolicy)} and is persisted to the cluster meta storage.
      *
      * @param shutdownPolicy Shutdown policy.
      */
     public void shutdownPolicy(ShutdownPolicy shutdownPolicy);
 }