blob: 6be6066de22bc808fe21a9925b5469c9d17c5967 [file] [log] [blame]
* Licensed to the Apache Software Foundation (ASF) under one or more contributor license
* agreements. See the NOTICE file distributed with this work for additional information regarding
* copyright ownership. The ASF licenses this file to You under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance with the License. You may obtain a
* copy of the License at
* Unless required by applicable law or agreed to in writing, software distributed under the License
* is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express
* or implied. See the License for the specific language governing permissions and limitations under
* the License.
package org.apache.geode.cache.wan;
import static com.palantir.docker.compose.execution.DockerComposeExecArgument.arguments;
import static com.palantir.docker.compose.execution.DockerComposeExecOption.options;
import static org.apache.geode.cache.Region.SEPARATOR;
import static org.apache.geode.distributed.ConfigurationProperties.DISTRIBUTED_SYSTEM_ID;
import static org.apache.geode.distributed.ConfigurationProperties.LOCATORS;
import static org.apache.geode.distributed.ConfigurationProperties.REMOTE_LOCATORS;
import static org.junit.Assert.assertEquals;
import static org.junit.Assert.assertNotNull;
import java.util.HashMap;
import java.util.Map;
import java.util.Properties;
import java.util.StringTokenizer;
import com.palantir.docker.compose.DockerComposeRule;
import org.junit.BeforeClass;
import org.junit.ClassRule;
import org.junit.Rule;
import org.junit.Test;
import org.junit.experimental.categories.Category;
import org.apache.geode.cache.Cache;
import org.apache.geode.cache.CacheFactory;
import org.apache.geode.cache.PartitionAttributesFactory;
import org.apache.geode.cache.Region;
import org.apache.geode.cache.RegionFactory;
import org.apache.geode.cache.RegionShortcut;
import org.apache.geode.cache.persistence.PartitionOfflineException;
import org.apache.geode.client.sni.NotOnWindowsDockerRule;
import org.apache.geode.distributed.Locator;
import org.apache.geode.internal.cache.ForceReattemptException;
import org.apache.geode.internal.cache.PoolStats;
import org.apache.geode.internal.cache.wan.AbstractGatewaySender;
import org.apache.geode.internal.cache.wan.InternalGatewaySenderFactory;
import org.apache.geode.test.dunit.IgnoredException;
import org.apache.geode.test.dunit.VM;
import org.apache.geode.test.dunit.rules.DistributedRule;
import org.apache.geode.test.junit.categories.WanTest;
* These tests use two Geode sites:
* - One site (the remote one) consisting of a 2-server, 1-locator Geode cluster.
* The servers host a partition region (region-wan) and have gateway receivers to receive events
* from the other site with the same value for hostname-for-senders and listening on the
* same port (2324).
* The servers and locator run each inside a Docker container and are not route-able
* from the host (where this JUnit test is running).
* Another Docker container is running the HAProxy image and it's set up as a TCP load balancer.
* The other site connects to the locator and to the gateway receivers via the
* TCP load balancer that forwards traffic directed to the 20334 port to the locator and
* traffic directed to the 2324 port to the receivers in a round robin fashion.
* - Another site consisting of a 1-server, 1-locator Geode cluster.
* The server hosts a partition region (region-wan) and has a parallel gateway sender
* to send events to the remote site.
* The aim of the tests is to verify that when several gateway receivers in a remote site
* share the same port and hostname-for-senders, the pings sent from the gateway senders
* reach the right gateway receiver and not just any of the receivers. Failure to do this
* may result in the closing of connections by a gateway receiver for not having
* received the ping in time.
// Test class header and shared fields/rules.
// NOTE(review): annotations and some initializer continuation lines are not visible in this
// view of the file; confirm against the full source before relying on these notes.
public class SeveralGatewayReceiversWithSamePortAndHostnameForSendersTest {
// Used below to size the DistributedRule (NUM_SERVERS + 1 VMs).
private static final int NUM_SERVERS = 2;
// Assigned inside createCache() and read by createGatewaySender(), createPartitionedRegion()
// and putGivenKeyValue().
private static Cache cache;
// NOTE(review): the initializer of this constant is not visible in this view.
private static final URL DOCKER_COMPOSE_PATH =
// Docker compose does not work on windows in CI. Ignore this test on windows
// Using a RuleChain to make sure we ignore the test before the rule comes into play
public static NotOnWindowsDockerRule docker =
new NotOnWindowsDockerRule(() -> DockerComposeRule.builder()
// Distributed-test rule configured with NUM_SERVERS + 1 VMs.
public DistributedRule distributedRule =
DistributedRule.builder().withVMCount(NUM_SERVERS + 1).build();
// Brings up the Docker-hosted site by running gfsh script files inside the "locator",
// "server1" and "server2" containers, in that order, and finally runs the create script on
// the "locator" container. Every exec call is issued with the "-T" option.
public static void beforeClass() throws Exception {
// Start locator
docker.get().exec(options("-T"), "locator",
arguments("gfsh", "run", "--file=/geode/scripts/geode-starter-locator.gfsh"));
// Start server1
docker.get().exec(options("-T"), "server1",
arguments("gfsh", "run", "--file=/geode/scripts/geode-starter-server1.gfsh"));
// Start server2
docker.get().exec(options("-T"), "server2",
arguments("gfsh", "run", "--file=/geode/scripts/geode-starter-server2.gfsh"));
// Create partition region and gateway receiver
docker.get().exec(options("-T"), "locator",
arguments("gfsh", "run", "--file=/geode/scripts/geode-starter-create.gfsh"));
// No-argument constructor. NOTE(review): its body is not visible in this view.
public SeveralGatewayReceiversWithSamePortAndHostnameForSendersTest() {
// Scenario: a locator is created in VM 0 (distributed-system id 1, remote locator port 20334);
// a cache, gateway sender "ln" and region "region-wan" are created in VM 1; 10 entries are
// put into the region; finally the sender pool's disconnect count is asserted to be 0.
// NOTE(review): the tail of the createGatewaySender call and the statement that uses
// maxTimeBetweenPingsInReceiver are not visible in this view.
public void testPingsToReceiversWithSamePortAndHostnameForSendersReachTheRightReceivers()
throws InterruptedException {
String senderId = "ln";
String regionName = "region-wan";
final int remoteLocPort = 20334;
int locPort = createLocator(VM.getVM(0), 1, remoteLocPort);
VM vm1 = VM.getVM(1);
createCache(vm1, locPort);
// We must use more than one dispatcher thread. With just one dispatcher thread, only one
// connection will be created by the sender towards one of the receivers and it will be
// monitored by the one ping thread for that remote receiver.
// With more than one thread, several connections will be opened and there should be one ping
// thread per remote receiver.
createGatewaySender(vm1, senderId, 2, true, 5,
createPartitionedRegion(vm1, regionName, senderId, 0, 10);
int NUM_PUTS = 10;
putKeyValues(vm1, NUM_PUTS, regionName);
// Wait longer than the value set in the receivers for
// maximum-time-between-pings: 10000 (see geode-starter-create.gfsh)
// to verify that connections are not closed
// by the receivers because each has received the pings timely.
int maxTimeBetweenPingsInReceiver = 15000;
// A non-zero value here would mean the sender's pool recorded at least one disconnect.
int senderPoolDisconnects = getSenderPoolDisconnects(vm1, senderId);
assertEquals(0, senderPoolDisconnects);
// Starts a locator inside memberVM and returns the value produced by that remote invocation.
// dsId is stored under DISTRIBUTED_SYSTEM_ID and remoteLocPort is used to build the
// REMOTE_LOCATORS value "localhost[<remoteLocPort>]".
// NOTE(review): the end of the return expression is not visible in this view; the caller
// treats the result as the locator port - confirm.
private int createLocator(VM memberVM, int dsId, int remoteLocPort) {
return memberVM.invoke("create locator", () -> {
Properties props = new Properties();
props.setProperty(DISTRIBUTED_SYSTEM_ID, "" + dsId);
props.setProperty(REMOTE_LOCATORS, "localhost[" + remoteLocPort + "]");
return Locator.startLocatorAndDS(0, new File(""), props)
// Creates a cache inside the given VM with LOCATORS set to "localhost[<locPort>]" and stores
// it in the static cache field (the assignment happens inside the vm.invoke lambda).
private static void createCache(VM vm, Integer locPort) {
vm.invoke(() -> {
Properties props = new Properties();
props.setProperty(LOCATORS, "localhost[" + locPort + "]");
CacheFactory cacheFactory = new CacheFactory(props);
cache = cacheFactory.create();
// Creates a gateway sender with id dsName targeting remoteDsId inside the given VM, using the
// sender factory obtained from the static cache. "Could not connect" is registered as an
// ignored exception before the sender is created.
// NOTE(review): the statements that would apply isParallel, batchSize, numDispatchers and
// orderPolicy, and the body of the finally block, are not visible in this view.
public static void createGatewaySender(VM vm, String dsName, int remoteDsId,
boolean isParallel, Integer batchSize,
int numDispatchers,
GatewaySender.OrderPolicy orderPolicy) {
vm.invoke(() -> {
final IgnoredException exln = IgnoredException.addIgnoredException("Could not connect");
try {
InternalGatewaySenderFactory gateway =
(InternalGatewaySenderFactory) cache.createGatewaySenderFactory();
gateway.create(dsName, remoteDsId);
} finally {
// Creates a region named regionName from a RegionShortcut.PARTITION factory inside the given
// VM. A non-null senderIds string is split on "," into individual sender ids.
// NOTE(review): the initializers of exp/exp1, what is done with each sender id, the use of
// redundantCopies/totalNumBuckets and the finally body are not visible in this view.
private static void createPartitionedRegion(VM vm, String regionName, String senderIds,
Integer redundantCopies, Integer totalNumBuckets) {
vm.invoke(() -> {
IgnoredException exp =
IgnoredException exp1 =
try {
RegionFactory fact = cache.createRegionFactory(RegionShortcut.PARTITION);
if (senderIds != null) {
StringTokenizer tokenizer = new StringTokenizer(senderIds, ",");
while (tokenizer.hasMoreTokens()) {
String senderId = tokenizer.nextToken();
PartitionAttributesFactory pfact = new PartitionAttributesFactory();
Region r = fact.create(regionName);
} finally {
// Returns, from inside the given VM, the disconnect count reported by the PoolStats of the
// gateway sender with id senderId. The sender is looked up through
// CacheFactory.getAnyInstance() rather than the static cache field.
private static int getSenderPoolDisconnects(VM vm, String senderId) {
return vm.invoke(() -> {
AbstractGatewaySender sender =
(AbstractGatewaySender) CacheFactory.getAnyInstance().getGatewaySender(senderId);
PoolStats poolStats = sender.getProxy().getStats();
return poolStats.getDisConnects();
// Builds a map whose keys 0..numPuts-1 each map to themselves and passes it, together with
// the region name, to putGivenKeyValue inside the given VM.
private static void putKeyValues(VM vm, int numPuts, String region) {
final HashMap<Integer, Integer> keyValues = new HashMap<>();
for (int i = 0; i < numPuts; i++) {
keyValues.put(i, i);
vm.invoke(() -> putGivenKeyValue(region, keyValues));
// Looks up the region at SEPARATOR + regionName in the static cache and writes every entry of
// keyValues into it with one put call per key.
private static void putGivenKeyValue(String regionName, Map<Integer, Integer> keyValues) {
Region<Integer, Integer> r = cache.getRegion(SEPARATOR + regionName);
for (Object key : keyValues.keySet()) {
r.put((Integer) key, keyValues.get(key));