blob: bce130d843600061b199f42b82ef027746d9ceae [file] [log] [blame]
/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
package org.apache.accumulo.test;
import static com.google.common.util.concurrent.Uninterruptibles.sleepUninterruptibly;
import static org.apache.accumulo.minicluster.ServerType.TABLET_SERVER;
import static org.junit.Assert.assertEquals;
import java.util.concurrent.TimeUnit;
import org.apache.accumulo.core.client.Accumulo;
import org.apache.accumulo.core.client.AccumuloClient;
import org.apache.accumulo.core.clientImpl.ClientContext;
import org.apache.accumulo.core.clientImpl.ManagerClient;
import org.apache.accumulo.core.clientImpl.thrift.ThriftNotActiveServiceException;
import org.apache.accumulo.core.conf.ClientProperty;
import org.apache.accumulo.core.conf.Property;
import org.apache.accumulo.core.master.thrift.ManagerClientService.Client;
import org.apache.accumulo.core.master.thrift.ManagerMonitorInfo;
import org.apache.accumulo.core.metadata.MetadataTable;
import org.apache.accumulo.core.security.Authorizations;
import org.apache.accumulo.core.trace.TraceUtil;
import org.apache.accumulo.fate.util.UtilWaitThread;
import org.apache.accumulo.miniclusterImpl.MiniAccumuloConfigImpl;
import org.apache.accumulo.test.functional.ConfigurableMacBase;
import org.apache.hadoop.conf.Configuration;
import org.junit.Test;
import com.google.common.collect.Iterators;
public class DetectDeadTabletServersIT extends ConfigurableMacBase {
@Override
protected void configure(MiniAccumuloConfigImpl cfg, Configuration hadoopCoreSite) {
cfg.setProperty(Property.INSTANCE_ZK_TIMEOUT, "15s");
cfg.setClientProperty(ClientProperty.INSTANCE_ZOOKEEPERS_TIMEOUT, "15s");
}
@Test
public void test() throws Exception {
try (AccumuloClient c = Accumulo.newClient().from(getClientProperties()).build()) {
log.info("verifying that everything is up");
Iterators.size(c.createScanner(MetadataTable.NAME, Authorizations.EMPTY).iterator());
ManagerMonitorInfo stats = getStats(c);
assertEquals(2, stats.tServerInfo.size());
assertEquals(0, stats.badTServers.size());
assertEquals(0, stats.deadTabletServers.size());
log.info("Killing a tablet server");
getCluster().killProcess(TABLET_SERVER,
getCluster().getProcesses().get(TABLET_SERVER).iterator().next());
while (true) {
stats = getStats(c);
if (stats.tServerInfo.size() != 2) {
break;
}
UtilWaitThread.sleep(500);
}
assertEquals(1, stats.tServerInfo.size());
assertEquals(1, stats.badTServers.size() + stats.deadTabletServers.size());
while (true) {
stats = getStats(c);
if (!stats.deadTabletServers.isEmpty()) {
break;
}
UtilWaitThread.sleep(500);
}
assertEquals(1, stats.tServerInfo.size());
assertEquals(0, stats.badTServers.size());
assertEquals(1, stats.deadTabletServers.size());
}
}
private ManagerMonitorInfo getStats(AccumuloClient c) throws Exception {
ClientContext context = (ClientContext) c;
Client client = null;
while (true) {
try {
client = ManagerClient.getConnectionWithRetry(context);
log.info("Fetching manager stats");
return client.getManagerStats(TraceUtil.traceInfo(), context.rpcCreds());
} catch (ThriftNotActiveServiceException e) {
// Let it loop, fetching a new location
sleepUninterruptibly(100, TimeUnit.MILLISECONDS);
} finally {
if (client != null) {
ManagerClient.close(client);
}
}
}
}
}