/*
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
package org.apache.samza.container.grouper.task;
import org.apache.samza.SamzaException;
import org.apache.samza.container.LocalityManager;
import org.apache.samza.job.model.ContainerModel;
import org.apache.samza.job.model.TaskModel;
import org.junit.Before;
import org.junit.Test;
import java.util.Collections;
import java.util.HashMap;
import java.util.HashSet;
import java.util.Map;
import java.util.Set;
import java.util.UUID;
import static org.apache.samza.container.mock.ContainerMocks.generateTaskContainerMapping;
import static org.apache.samza.container.mock.ContainerMocks.generateTaskModels;
import static org.apache.samza.container.mock.ContainerMocks.getTaskModel;
import static org.apache.samza.container.mock.ContainerMocks.getTaskName;
import static org.junit.Assert.assertEquals;
import static org.junit.Assert.assertNotNull;
import static org.junit.Assert.assertTrue;
import static org.mockito.Mockito.anyCollection;
import static org.mockito.Mockito.anyString;
import static org.mockito.Mockito.mock;
import static org.mockito.Mockito.never;
import static org.mockito.Mockito.verify;
import static org.mockito.Mockito.when;
public class TestGroupByContainerCount {
// Mockito stand-ins shared by the tests; both are re-created by setup() before each test.
private LocalityManager localityManager;
private TaskAssignmentManager taskAssignmentManager;

/**
 * Builds fresh mocks and stubs the locality manager so that
 * {@code getTaskAssignmentManager()} returns the mocked assignment manager.
 */
@Before
public void setup() {
  localityManager = mock(LocalityManager.class);
  taskAssignmentManager = mock(TaskAssignmentManager.class);
  when(localityManager.getTaskAssignmentManager()).thenReturn(taskAssignmentManager);
}
/**
 * Grouping an empty task set is expected to be rejected with an
 * {@link IllegalArgumentException}.
 */
@Test(expected = IllegalArgumentException.class)
public void testGroupEmptyTasks() {
  // Explicit type argument instead of a raw HashSet, so the call is type-checked
  // and compiles without an unchecked-conversion warning.
  new GroupByContainerCount(1).group(new HashSet<TaskModel>());
}
/**
 * Requesting two containers for a single task is expected to fail with an
 * {@link IllegalArgumentException}.
 */
@Test(expected = IllegalArgumentException.class)
public void testGroupFewerTasksThanContainers() {
  Set<TaskModel> singleTask = new HashSet<>(Collections.singleton(getTaskModel(1)));
  GroupByContainerCount twoContainerGrouper = new GroupByContainerCount(2);
  twoContainerGrouper.group(singleTask);
}
/**
 * Removing an element from the set returned by {@code group()} is expected to throw
 * {@link UnsupportedOperationException}.
 */
@Test(expected = UnsupportedOperationException.class)
public void testGrouperResultImmutable() {
  Set<TaskModel> tasks = generateTaskModels(3);
  Set<ContainerModel> grouped = new GroupByContainerCount(3).group(tasks);
  ContainerModel anyContainer = grouped.iterator().next();
  grouped.remove(anyContainer);
}
/**
 * Groups five tasks into two containers. The assertions expect container "0" to hold
 * tasks 0, 2 and 4, and container "1" to hold tasks 1 and 3.
 */
@Test
public void testGroupHappyPath() {
  Set<TaskModel> tasks = generateTaskModels(5);
  Set<ContainerModel> grouped = new GroupByContainerCount(2).group(tasks);

  // Index the result by processor id so each container can be inspected on its own.
  Map<String, ContainerModel> byProcessorId = new HashMap<>();
  grouped.forEach(model -> byProcessorId.put(model.getProcessorId(), model));

  assertEquals(2, grouped.size());
  ContainerModel first = byProcessorId.get("0");
  ContainerModel second = byProcessorId.get("1");
  assertNotNull(first);
  assertNotNull(second);
  assertEquals("0", first.getProcessorId());
  assertEquals("1", second.getProcessorId());

  Map<?, ?> firstTasks = first.getTasks();
  Map<?, ?> secondTasks = second.getTasks();
  assertEquals(3, firstTasks.size());
  assertEquals(2, secondTasks.size());
  for (int id : new int[] {0, 2, 4}) {
    assertTrue(firstTasks.containsKey(getTaskName(id)));
  }
  for (int id : new int[] {1, 3}) {
    assertTrue(secondTasks.containsKey(getTaskName(id)));
  }
}
/**
 * Groups 21 tasks into two containers and pins the exact membership of each one:
 * 11 tasks are expected on container "0" and 10 on container "1".
 */
@Test
public void testGroupManyTasks() {
  Set<TaskModel> tasks = generateTaskModels(21);
  Set<ContainerModel> grouped = new GroupByContainerCount(2).group(tasks);

  Map<String, ContainerModel> byProcessorId = new HashMap<>();
  grouped.forEach(model -> byProcessorId.put(model.getProcessorId(), model));

  assertEquals(2, grouped.size());
  ContainerModel first = byProcessorId.get("0");
  ContainerModel second = byProcessorId.get("1");
  assertNotNull(first);
  assertNotNull(second);
  assertEquals("0", first.getProcessorId());
  assertEquals("1", second.getProcessorId());

  Map<?, ?> firstTasks = first.getTasks();
  Map<?, ?> secondTasks = second.getTasks();
  assertEquals(11, firstTasks.size());
  assertEquals(10, secondTasks.size());

  // NOTE: tasks are sorted lexicographically, so the container assignment
  // can seem odd, but the consistency is the key focus
  for (int id : new int[] {0, 10, 12, 14, 16, 18, 2, 3, 5, 7, 9}) {
    assertTrue(firstTasks.containsKey(getTaskName(id)));
  }
  for (int id : new int[] {1, 11, 13, 15, 17, 19, 20, 4, 6, 8}) {
    assertTrue(secondTasks.containsKey(getTaskName(id)));
  }
}
/**
 * Rebalances nine tasks from two containers to four.
 *
 * <pre>
 * Before:
 *  C0  C1
 * --------
 *  T0  T1
 *  T2  T3
 *  T4  T5
 *  T6  T7
 *  T8
 *
 * After:
 *  C0  C1  C2  C3
 * ----------------
 *  T0  T1  T6  T5
 *  T2  T3  T8  T7
 *  T4
 * </pre>
 *
 * NOTE for host affinity, it would help to have some additional logic to reassign tasks
 * from C0 and C1 to containers that were on the same respective hosts. It wasn't implemented
 * because the scenario is infrequent, the benefits are not guaranteed, and the code complexity
 * wasn't worth it. It certainly could be implemented in the future.
 */
@Test
public void testBalancerAfterContainerIncrease() {
  Set<TaskModel> tasks = generateTaskModels(9);
  Set<ContainerModel> previous = new GroupByContainerCount(2).group(tasks);
  Map<String, String> previousAssignment = generateTaskContainerMapping(previous);
  when(taskAssignmentManager.readTaskAssignment()).thenReturn(previousAssignment);

  Set<ContainerModel> balanced = new GroupByContainerCount(4).balance(tasks, localityManager);

  Map<String, ContainerModel> byProcessorId = new HashMap<>();
  balanced.forEach(model -> byProcessorId.put(model.getProcessorId(), model));

  assertEquals(4, balanced.size());
  ContainerModel c0 = byProcessorId.get("0");
  ContainerModel c1 = byProcessorId.get("1");
  ContainerModel c2 = byProcessorId.get("2");
  ContainerModel c3 = byProcessorId.get("3");
  assertNotNull(c0);
  assertNotNull(c1);
  assertNotNull(c2);
  assertNotNull(c3);
  assertEquals("0", c0.getProcessorId());
  assertEquals("1", c1.getProcessorId());
  assertEquals(3, c0.getTasks().size());
  assertEquals(2, c1.getTasks().size());
  assertEquals(2, c2.getTasks().size());
  assertEquals(2, c3.getTasks().size());

  // Tasks 0-4 should stay on the same original containers
  for (int id : new int[] {0, 2, 4}) {
    assertTrue(c0.getTasks().containsKey(getTaskName(id)));
  }
  for (int id : new int[] {1, 3}) {
    assertTrue(c1.getTasks().containsKey(getTaskName(id)));
  }

  // Tasks 5-8 should be reassigned to the new containers.
  // Consistency is the goal with these reassignments
  for (int id : new int[] {8, 6}) {
    assertTrue(c2.getTasks().containsKey(getTaskName(id)));
  }
  for (int id : new int[] {5, 7}) {
    assertTrue(c3.getTasks().containsKey(getTaskName(id)));
  }

  // Verify task mappings are saved
  for (int id : new int[] {0, 2, 4}) {
    verify(taskAssignmentManager).writeTaskContainerMapping(getTaskName(id).getTaskName(), "0");
  }
  for (int id : new int[] {1, 3}) {
    verify(taskAssignmentManager).writeTaskContainerMapping(getTaskName(id).getTaskName(), "1");
  }
  for (int id : new int[] {8, 6}) {
    verify(taskAssignmentManager).writeTaskContainerMapping(getTaskName(id).getTaskName(), "2");
  }
  for (int id : new int[] {5, 7}) {
    verify(taskAssignmentManager).writeTaskContainerMapping(getTaskName(id).getTaskName(), "3");
  }
  verify(taskAssignmentManager, never()).deleteTaskContainerMappings(anyCollection());
}
/**
 * Rebalances nine tasks from four containers down to two.
 *
 * <pre>
 * Before:
 *  C0  C1  C2  C3
 * ----------------
 *  T0  T1  T2  T3
 *  T4  T5  T6  T7
 *  T8
 *
 * After:
 *  C0  C1
 * --------
 *  T0  T1
 *  T4  T5
 *  T8  T7
 *  T6  T3
 *  T2
 * </pre>
 *
 * NOTE for host affinity, it would help to have some additional logic to reassign tasks
 * from C2 and C3 to containers that were on the same respective hosts. It wasn't implemented
 * because the scenario is infrequent, the benefits are not guaranteed, and the code complexity
 * wasn't worth it. It certainly could be implemented in the future.
 */
@Test
public void testBalancerAfterContainerDecrease() {
  Set<TaskModel> tasks = generateTaskModels(9);
  Set<ContainerModel> previous = new GroupByContainerCount(4).group(tasks);
  Map<String, String> previousAssignment = generateTaskContainerMapping(previous);
  when(taskAssignmentManager.readTaskAssignment()).thenReturn(previousAssignment);

  Set<ContainerModel> balanced = new GroupByContainerCount(2).balance(tasks, localityManager);

  Map<String, ContainerModel> byProcessorId = new HashMap<>();
  balanced.forEach(model -> byProcessorId.put(model.getProcessorId(), model));

  assertEquals(2, balanced.size());
  ContainerModel c0 = byProcessorId.get("0");
  ContainerModel c1 = byProcessorId.get("1");
  assertNotNull(c0);
  assertNotNull(c1);
  assertEquals("0", c0.getProcessorId());
  assertEquals("1", c1.getProcessorId());
  assertEquals(5, c0.getTasks().size());
  assertEquals(4, c1.getTasks().size());

  // Tasks 0,4,8 and 1,5 should stay on the same original containers
  for (int id : new int[] {0, 4, 8}) {
    assertTrue(c0.getTasks().containsKey(getTaskName(id)));
  }
  for (int id : new int[] {1, 5}) {
    assertTrue(c1.getTasks().containsKey(getTaskName(id)));
  }

  // Tasks 2,6 and 3,7 lived on the removed containers and should be reassigned
  // to the remaining ones. Consistency is the goal with these reassignments
  for (int id : new int[] {6, 2}) {
    assertTrue(c0.getTasks().containsKey(getTaskName(id)));
  }
  for (int id : new int[] {7, 3}) {
    assertTrue(c1.getTasks().containsKey(getTaskName(id)));
  }

  // Verify task mappings are saved
  for (int id : new int[] {0, 4, 8, 6, 2}) {
    verify(taskAssignmentManager).writeTaskContainerMapping(getTaskName(id).getTaskName(), "0");
  }
  for (int id : new int[] {1, 5, 7, 3}) {
    verify(taskAssignmentManager).writeTaskContainerMapping(getTaskName(id).getTaskName(), "1");
  }
  verify(taskAssignmentManager, never()).deleteTaskContainerMappings(anyCollection());
}
/**
 * Runs two rebalances in a row: first from four containers to two, then to three.
 *
 * <pre>
 * Before:
 *  C0  C1  C2  C3
 * ----------------
 *  T0  T1  T2  T3
 *  T4  T5  T6  T7
 *  T8
 *
 * Intermediate:
 *  C0  C1
 * --------
 *  T0  T1
 *  T4  T5
 *  T8  T7
 *  T6  T3
 *  T2
 *
 * After:
 *  C0  C1  C2
 * ------------
 *  T0  T1  T6
 *  T4  T5  T2
 *  T8  T7  T3
 * </pre>
 */
@Test
public void testBalancerMultipleReblances() {
  // Before
  Set<TaskModel> tasks = generateTaskModels(9);
  Set<ContainerModel> original = new GroupByContainerCount(4).group(tasks);
  Map<String, String> originalAssignment = generateTaskContainerMapping(original);
  when(taskAssignmentManager.readTaskAssignment()).thenReturn(originalAssignment);

  // First balance
  Set<ContainerModel> firstResult = new GroupByContainerCount(2).balance(tasks, localityManager);
  Map<String, ContainerModel> firstById = new HashMap<>();
  firstResult.forEach(model -> firstById.put(model.getProcessorId(), model));

  assertEquals(2, firstResult.size());
  ContainerModel c0 = firstById.get("0");
  ContainerModel c1 = firstById.get("1");
  assertNotNull(c0);
  assertNotNull(c1);
  assertEquals("0", c0.getProcessorId());
  assertEquals("1", c1.getProcessorId());
  assertEquals(5, c0.getTasks().size());
  assertEquals(4, c1.getTasks().size());

  // Tasks 0,4,8 and 1,5 should stay on the same original containers
  for (int id : new int[] {0, 4, 8}) {
    assertTrue(c0.getTasks().containsKey(getTaskName(id)));
  }
  for (int id : new int[] {1, 5}) {
    assertTrue(c1.getTasks().containsKey(getTaskName(id)));
  }

  // Tasks 2,6 and 3,7 should be reassigned to the remaining containers.
  // Consistency is the goal with these reassignments
  for (int id : new int[] {6, 2}) {
    assertTrue(c0.getTasks().containsKey(getTaskName(id)));
  }
  for (int id : new int[] {7, 3}) {
    assertTrue(c1.getTasks().containsKey(getTaskName(id)));
  }

  // Verify task mappings are saved
  for (int id : new int[] {0, 4, 8, 6, 2}) {
    verify(taskAssignmentManager).writeTaskContainerMapping(getTaskName(id).getTaskName(), "0");
  }
  for (int id : new int[] {1, 5, 7, 3}) {
    verify(taskAssignmentManager).writeTaskContainerMapping(getTaskName(id).getTaskName(), "1");
  }
  verify(taskAssignmentManager, never()).deleteTaskContainerMappings(anyCollection());

  // Second balance
  // NOTE(review): the mapping fed to the second balance is rebuilt from the ORIGINAL
  // four-container grouping, not from the result of the first balance - confirm this is intended.
  Map<String, String> secondAssignment = generateTaskContainerMapping(original);
  TaskAssignmentManager taskAssignmentManager2 = mock(TaskAssignmentManager.class);
  when(taskAssignmentManager2.readTaskAssignment()).thenReturn(secondAssignment);
  LocalityManager localityManager2 = mock(LocalityManager.class);
  when(localityManager2.getTaskAssignmentManager()).thenReturn(taskAssignmentManager2);

  Set<ContainerModel> secondResult = new GroupByContainerCount(3).balance(tasks, localityManager2);
  Map<String, ContainerModel> secondById = new HashMap<>();
  secondResult.forEach(model -> secondById.put(model.getProcessorId(), model));

  assertEquals(3, secondResult.size());
  c0 = secondById.get("0");
  c1 = secondById.get("1");
  ContainerModel c2 = secondById.get("2");
  assertNotNull(c0);
  assertNotNull(c1);
  assertNotNull(c2);
  assertEquals("0", c0.getProcessorId());
  assertEquals("1", c1.getProcessorId());
  assertEquals("2", c2.getProcessorId());
  assertEquals(3, c0.getTasks().size());
  assertEquals(3, c1.getTasks().size());
  assertEquals(3, c2.getTasks().size());

  // Tasks 0,4,8 and 1,5,7 should stay on the same original containers
  for (int id : new int[] {0, 4, 8}) {
    assertTrue(c0.getTasks().containsKey(getTaskName(id)));
  }
  for (int id : new int[] {1, 5, 7}) {
    assertTrue(c1.getTasks().containsKey(getTaskName(id)));
  }

  // Tasks 2,6 and 3 should be reassigned to the new container.
  // Consistency is the goal with these reassignments
  for (int id : new int[] {6, 2, 3}) {
    assertTrue(c2.getTasks().containsKey(getTaskName(id)));
  }

  // Verify task mappings are saved
  for (int id : new int[] {0, 4, 8}) {
    verify(taskAssignmentManager2).writeTaskContainerMapping(getTaskName(id).getTaskName(), "0");
  }
  for (int id : new int[] {1, 5, 7}) {
    verify(taskAssignmentManager2).writeTaskContainerMapping(getTaskName(id).getTaskName(), "1");
  }
  for (int id : new int[] {6, 2, 3}) {
    verify(taskAssignmentManager2).writeTaskContainerMapping(getTaskName(id).getTaskName(), "2");
  }
  verify(taskAssignmentManager2, never()).deleteTaskContainerMappings(anyCollection());
}
/**
 * Balancing with an unchanged container count: the assignment is expected to stay exactly
 * as it was, and nothing is expected to be written to or deleted from the assignment manager.
 *
 * <pre>
 * Before:
 *  C0  C1
 * --------
 *  T0  T1
 *  T2  T3
 *  T4  T5
 *  T6  T7
 *  T8
 *
 * After:
 *  C0  C1
 * --------
 *  T0  T1
 *  T2  T3
 *  T4  T5
 *  T6  T7
 *  T8
 * </pre>
 */
@Test
public void testBalancerAfterContainerSame() {
  Set<TaskModel> tasks = generateTaskModels(9);
  Set<ContainerModel> previous = new GroupByContainerCount(2).group(tasks);
  Map<String, String> previousAssignment = generateTaskContainerMapping(previous);
  when(taskAssignmentManager.readTaskAssignment()).thenReturn(previousAssignment);

  Set<ContainerModel> balanced = new GroupByContainerCount(2).balance(tasks, localityManager);

  Map<String, ContainerModel> byProcessorId = new HashMap<>();
  balanced.forEach(model -> byProcessorId.put(model.getProcessorId(), model));

  assertEquals(2, balanced.size());
  ContainerModel c0 = byProcessorId.get("0");
  ContainerModel c1 = byProcessorId.get("1");
  assertNotNull(c0);
  assertNotNull(c1);
  assertEquals("0", c0.getProcessorId());
  assertEquals("1", c1.getProcessorId());
  assertEquals(5, c0.getTasks().size());
  assertEquals(4, c1.getTasks().size());

  for (int id : new int[] {0, 2, 4, 6, 8}) {
    assertTrue(c0.getTasks().containsKey(getTaskName(id)));
  }
  for (int id : new int[] {1, 3, 5, 7}) {
    assertTrue(c1.getTasks().containsKey(getTaskName(id)));
  }

  verify(taskAssignmentManager, never()).writeTaskContainerMapping(anyString(), anyString());
  verify(taskAssignmentManager, never()).deleteTaskContainerMappings(anyCollection());
}
/**
 * Verifies the ability to have a custom task-container mapping that is *deliberately*
 * unbalanced: with the container count unchanged, the hand-built mapping is expected to be
 * kept as is and nothing is expected to be written or deleted.
 *
 * <pre>
 * Before:
 *  C0  C1
 * --------
 *  T0  T6
 *  T1  T7
 *  T2  T8
 *  T3
 *  T4
 *  T5
 *
 * After:
 *  C0  C1
 * --------
 *  T0  T6
 *  T1  T7
 *  T2  T8
 *  T3
 *  T4
 *  T5
 * </pre>
 */
@Test
public void testBalancerAfterContainerSameCustomAssignment() {
  Set<TaskModel> tasks = generateTaskModels(9);

  // Tasks 0-5 are pinned to container "0", tasks 6-8 to container "1".
  Map<String, String> customAssignment = new HashMap<>();
  for (int id = 0; id < 9; id++) {
    customAssignment.put(getTaskName(id).getTaskName(), id < 6 ? "0" : "1");
  }
  when(taskAssignmentManager.readTaskAssignment()).thenReturn(customAssignment);

  Set<ContainerModel> balanced = new GroupByContainerCount(2).balance(tasks, localityManager);

  Map<String, ContainerModel> byProcessorId = new HashMap<>();
  balanced.forEach(model -> byProcessorId.put(model.getProcessorId(), model));

  assertEquals(2, balanced.size());
  ContainerModel c0 = byProcessorId.get("0");
  ContainerModel c1 = byProcessorId.get("1");
  assertNotNull(c0);
  assertNotNull(c1);
  assertEquals("0", c0.getProcessorId());
  assertEquals("1", c1.getProcessorId());
  assertEquals(6, c0.getTasks().size());
  assertEquals(3, c1.getTasks().size());

  for (int id = 0; id <= 5; id++) {
    assertTrue(c0.getTasks().containsKey(getTaskName(id)));
  }
  for (int id = 6; id <= 8; id++) {
    assertTrue(c1.getTasks().containsKey(getTaskName(id)));
  }

  verify(taskAssignmentManager, never()).writeTaskContainerMapping(anyString(), anyString());
  verify(taskAssignmentManager, never()).deleteTaskContainerMappings(anyCollection());
}
/**
 * Verifies rebalancing from a custom task-container mapping that is *deliberately* unbalanced
 * while the container count grows from two to three.
 *
 * <pre>
 * Before:
 *  C0  C1
 * --------
 *  T0  T1
 *      T2
 *      T3
 *      T4
 *      T5
 *
 * After:
 *  C0  C1  C2
 * ------------
 *  T0  T1  T4
 *  T5  T2  T3
 * </pre>
 *
 * The key here is that C0, which is not one of the new containers, was under-allocated.
 * This is an important case because this scenario, while impossible with
 * GroupByContainerCount.group(), could occur when the grouper class is switched or if there
 * is a custom mapping.
 */
@Test
public void testBalancerAfterContainerSameCustomAssignmentAndContainerIncrease() {
  Set<TaskModel> taskModels = generateTaskModels(6);

  // Task 0 sits alone on container "0"; tasks 1-5 are all on container "1".
  Map<String, String> prevTaskToContainerMapping = new HashMap<>();
  prevTaskToContainerMapping.put(getTaskName(0).getTaskName(), "0");
  for (int id = 1; id <= 5; id++) {
    prevTaskToContainerMapping.put(getTaskName(id).getTaskName(), "1");
  }
  when(taskAssignmentManager.readTaskAssignment()).thenReturn(prevTaskToContainerMapping);

  Set<ContainerModel> containers = new GroupByContainerCount(3).balance(taskModels, localityManager);

  Map<String, ContainerModel> containersMap = new HashMap<>();
  for (ContainerModel container : containers) {
    containersMap.put(container.getProcessorId(), container);
  }

  assertEquals(3, containers.size());
  ContainerModel container0 = containersMap.get("0");
  ContainerModel container1 = containersMap.get("1");
  ContainerModel container2 = containersMap.get("2");
  assertNotNull(container0);
  assertNotNull(container1);
  assertNotNull(container2);
  assertEquals("0", container0.getProcessorId());
  assertEquals("1", container1.getProcessorId());
  assertEquals("2", container2.getProcessorId());
  assertEquals(2, container0.getTasks().size());
  assertEquals(2, container1.getTasks().size());
  // Previously this line re-checked container1, leaving container2's size unverified.
  assertEquals(2, container2.getTasks().size());

  assertTrue(container0.getTasks().containsKey(getTaskName(0)));
  assertTrue(container0.getTasks().containsKey(getTaskName(5)));
  assertTrue(container1.getTasks().containsKey(getTaskName(1)));
  assertTrue(container1.getTasks().containsKey(getTaskName(2)));
  assertTrue(container2.getTasks().containsKey(getTaskName(4)));
  assertTrue(container2.getTasks().containsKey(getTaskName(3)));

  // Verify task mappings are saved
  verify(taskAssignmentManager).writeTaskContainerMapping(getTaskName(0).getTaskName(), "0");
  verify(taskAssignmentManager).writeTaskContainerMapping(getTaskName(1).getTaskName(), "1");
  verify(taskAssignmentManager).writeTaskContainerMapping(getTaskName(2).getTaskName(), "1");
  verify(taskAssignmentManager).writeTaskContainerMapping(getTaskName(3).getTaskName(), "2");
  verify(taskAssignmentManager).writeTaskContainerMapping(getTaskName(4).getTaskName(), "2");
  verify(taskAssignmentManager).writeTaskContainerMapping(getTaskName(5).getTaskName(), "0");
  verify(taskAssignmentManager, never()).deleteTaskContainerMappings(anyCollection());
}
/**
 * When the previous assignment used a single container, {@code balance()} is expected to
 * produce the same result as {@code group()} and to save the new mapping without deleting
 * anything.
 */
@Test
public void testBalancerOldContainerCountOne() {
  Set<TaskModel> tasks = generateTaskModels(3);
  Set<ContainerModel> previous = new GroupByContainerCount(1).group(tasks);
  Map<String, String> previousAssignment = generateTaskContainerMapping(previous);
  when(taskAssignmentManager.readTaskAssignment()).thenReturn(previousAssignment);

  Set<ContainerModel> grouped = new GroupByContainerCount(3).group(tasks);
  Set<ContainerModel> balanced = new GroupByContainerCount(3).balance(tasks, localityManager);

  // Results should be the same as calling group()
  assertEquals(grouped, balanced);

  // Verify task mappings are saved: task i is expected on container "i"
  for (int id = 0; id < 3; id++) {
    verify(taskAssignmentManager)
        .writeTaskContainerMapping(getTaskName(id).getTaskName(), String.valueOf(id));
  }
  verify(taskAssignmentManager, never()).deleteTaskContainerMappings(anyCollection());
}
/**
 * When the new container count is one, {@code balance()} is expected to produce the same
 * result as {@code group()}, saving every task against container "0" and deleting nothing.
 */
@Test
public void testBalancerNewContainerCountOne() {
  Set<TaskModel> tasks = generateTaskModels(3);
  Set<ContainerModel> previous = new GroupByContainerCount(3).group(tasks);
  Map<String, String> previousAssignment = generateTaskContainerMapping(previous);
  when(taskAssignmentManager.readTaskAssignment()).thenReturn(previousAssignment);

  Set<ContainerModel> grouped = new GroupByContainerCount(1).group(tasks);
  Set<ContainerModel> balanced = new GroupByContainerCount(1).balance(tasks, localityManager);

  // Results should be the same as calling group()
  assertEquals(grouped, balanced);

  for (int id = 0; id < 3; id++) {
    verify(taskAssignmentManager).writeTaskContainerMapping(getTaskName(id).getTaskName(), "0");
  }
  verify(taskAssignmentManager, never()).deleteTaskContainerMappings(anyCollection());
}
/**
 * When no previous task assignment is stored, {@code balance()} is expected to produce the
 * same result as {@code group()} and to save the resulting mapping without deleting anything.
 */
@Test
public void testBalancerEmptyTaskMapping() {
  Set<TaskModel> tasks = generateTaskModels(3);
  Map<String, String> noAssignments = new HashMap<>();
  when(taskAssignmentManager.readTaskAssignment()).thenReturn(noAssignments);

  Set<ContainerModel> grouped = new GroupByContainerCount(1).group(tasks);
  Set<ContainerModel> balanced = new GroupByContainerCount(1).balance(tasks, localityManager);

  // Results should be the same as calling group()
  assertEquals(grouped, balanced);

  for (int id = 0; id < 3; id++) {
    verify(taskAssignmentManager).writeTaskContainerMapping(getTaskName(id).getTaskName(), "0");
  }
  verify(taskAssignmentManager, never()).deleteTaskContainerMappings(anyCollection());
}
/**
 * The stored assignment covers one task fewer than the current task set. The test expects
 * {@code balance()} to match {@code group()}, to save the new mapping, and to delete the
 * stale mappings.
 */
@Test
public void testGroupTaskCountIncrease() {
  int taskCount = 3;
  Set<TaskModel> tasks = generateTaskModels(taskCount);

  // Here's the key step: the previous grouping was computed for fewer tasks
  Set<TaskModel> fewerTasks = generateTaskModels(taskCount - 1);
  Set<ContainerModel> previous = new GroupByContainerCount(2).group(fewerTasks);
  Map<String, String> previousAssignment = generateTaskContainerMapping(previous);
  when(taskAssignmentManager.readTaskAssignment()).thenReturn(previousAssignment);

  Set<ContainerModel> grouped = new GroupByContainerCount(1).group(tasks);
  Set<ContainerModel> balanced = new GroupByContainerCount(1).balance(tasks, localityManager);

  // Results should be the same as calling group()
  assertEquals(grouped, balanced);

  for (int id = 0; id < 3; id++) {
    verify(taskAssignmentManager).writeTaskContainerMapping(getTaskName(id).getTaskName(), "0");
  }
  verify(taskAssignmentManager).deleteTaskContainerMappings(anyCollection());
}
/**
 * The stored assignment covers one task more than the current task set. The test expects
 * {@code balance()} to match {@code group()}, to save the new mapping, and to delete the
 * stale mappings.
 */
@Test
public void testGroupTaskCountDecrease() {
  int taskCount = 3;
  Set<TaskModel> tasks = generateTaskModels(taskCount);

  // Here's the key step: the previous grouping was computed for more tasks
  Set<TaskModel> moreTasks = generateTaskModels(taskCount + 1);
  Set<ContainerModel> previous = new GroupByContainerCount(3).group(moreTasks);
  Map<String, String> previousAssignment = generateTaskContainerMapping(previous);
  when(taskAssignmentManager.readTaskAssignment()).thenReturn(previousAssignment);

  Set<ContainerModel> grouped = new GroupByContainerCount(1).group(tasks);
  Set<ContainerModel> balanced = new GroupByContainerCount(1).balance(tasks, localityManager);

  // Results should be the same as calling group()
  assertEquals(grouped, balanced);

  for (int id = 0; id < 3; id++) {
    verify(taskAssignmentManager).writeTaskContainerMapping(getTaskName(id).getTaskName(), "0");
  }
  verify(taskAssignmentManager).deleteTaskContainerMappings(anyCollection());
}
/**
 * Balancing three tasks across five containers is expected to fail with an
 * {@link IllegalArgumentException}.
 */
@Test(expected = IllegalArgumentException.class)
public void testBalancerNewContainerCountGreaterThanTasks() {
  Set<TaskModel> tasks = generateTaskModels(3);
  Set<ContainerModel> previous = new GroupByContainerCount(3).group(tasks);
  Map<String, String> previousAssignment = generateTaskContainerMapping(previous);
  when(taskAssignmentManager.readTaskAssignment()).thenReturn(previousAssignment);

  GroupByContainerCount tooManyContainers = new GroupByContainerCount(5);
  tooManyContainers.balance(tasks, localityManager); // Should throw
}
/**
 * Calling {@code balance()} with an empty task set is expected to fail with an
 * {@link IllegalArgumentException}, even though a previous assignment is available.
 */
@Test(expected = IllegalArgumentException.class)
public void testBalancerEmptyTasks() {
  Set<TaskModel> tasks = generateTaskModels(3);
  Set<ContainerModel> previous = new GroupByContainerCount(3).group(tasks);
  Map<String, String> previousAssignment = generateTaskContainerMapping(previous);
  when(taskAssignmentManager.readTaskAssignment()).thenReturn(previousAssignment);

  GroupByContainerCount grouper = new GroupByContainerCount(5);
  Set<TaskModel> noTasks = new HashSet<TaskModel>();
  grouper.balance(noTasks, localityManager); // Should throw
}
/**
 * Removing an element from the set returned by {@code balance()} is expected to throw
 * {@link UnsupportedOperationException}.
 */
@Test(expected = UnsupportedOperationException.class)
public void testBalancerResultImmutable() {
  Set<TaskModel> tasks = generateTaskModels(3);
  Set<ContainerModel> previous = new GroupByContainerCount(3).group(tasks);
  Map<String, String> previousAssignment = generateTaskContainerMapping(previous);
  when(taskAssignmentManager.readTaskAssignment()).thenReturn(previousAssignment);

  Set<ContainerModel> balanced = new GroupByContainerCount(2).balance(tasks, localityManager);
  ContainerModel anyContainer = balanced.iterator().next();
  balanced.remove(anyContainer);
}
/**
 * Feeds {@code balance()} a previous assignment whose container ids are random UUID strings
 * and expects a {@link SamzaException}.
 */
@Test(expected = SamzaException.class)
public void testBalancerThrowsOnNonIntegerContainerIds() {
  Set<TaskModel> tasks = generateTaskModels(3);

  // One single-task container per task, each identified by a UUID instead of a number.
  Set<ContainerModel> previous = new HashSet<>();
  for (TaskModel task : tasks) {
    String uuidContainerId = UUID.randomUUID().toString();
    previous.add(
        new ContainerModel(uuidContainerId, -1, Collections.singletonMap(task.getTaskName(), task)));
  }

  Map<String, String> previousAssignment = generateTaskContainerMapping(previous);
  when(taskAssignmentManager.readTaskAssignment()).thenReturn(previousAssignment);
  new GroupByContainerCount(3).balance(tasks, localityManager); //Should throw
}
/**
 * With a {@code null} locality manager, {@code balance()} is expected to return the same
 * container models as {@code group()}.
 */
@Test
public void testBalancerWithNullLocalityManager() {
  Set<TaskModel> tasks = generateTaskModels(3);
  Set<ContainerModel> grouped = new GroupByContainerCount(3).group(tasks);
  Set<ContainerModel> balanced = new GroupByContainerCount(3).balance(tasks, null);

  // Results should be the same as calling group()
  assertEquals(grouped, balanced);
}
}