| #!/usr/bin/python |
| |
| # Licensed to the Apache Software Foundation (ASF) under one or more |
| # contributor license agreements. See the NOTICE file distributed with |
| # this work for additional information regarding copyright ownership. |
| # The ASF licenses this file to You under the Apache License, Version 2.0 |
| # (the "License"); you may not use this file except in compliance with |
| # the License. You may obtain a copy of the License at |
| # |
| # http://www.apache.org/licenses/LICENSE-2.0 |
| # |
| # Unless required by applicable law or agreed to in writing, software |
| # distributed under the License is distributed on an "AS IS" BASIS, |
| # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| # See the License for the specific language governing permissions and |
| # limitations under the License. |
| |
| import os |
| import time |
| import re |
| import logging |
| from blockadeUtils.blockade import Blockade |
| from clusterUtils.cluster_utils import ClusterUtils |
| |
| logger = logging.getLogger(__name__) |
| parent_dir = os.path.dirname(os.path.dirname(os.path.realpath(__file__))) |
| FILE = os.path.join(parent_dir, "compose", "ozoneblockade", |
| "docker-compose.yaml") |
| os.environ["DOCKER_COMPOSE_FILE"] = FILE |
| SCALE = 3 |
| INCREASED_SCALE = 5 |
| CONTAINER_LIST = [] |
| OM = [] |
| SCM = [] |
| DATANODES = [] |
| |
| |
| def setup(): |
| global CONTAINER_LIST, OM, SCM, DATANODES |
| Blockade.blockade_destroy() |
| CONTAINER_LIST = ClusterUtils.cluster_setup(FILE, SCALE) |
| exit_code, output = Blockade.blockade_status() |
| assert exit_code == 0, "blockade status command failed with output=[%s]" % \ |
| output |
| OM, SCM, _, DATANODES = \ |
| ClusterUtils.find_om_scm_client_datanodes(CONTAINER_LIST) |
| |
| exit_code, output = ClusterUtils.run_freon(FILE, 1, 1, 1, 10240, "RATIS", |
| "THREE") |
| assert exit_code == 0, "freon run failed with output=[%s]" % output |
| |
| |
| def teardown(): |
| logger.info("Inside teardown") |
| Blockade.blockade_destroy() |
| |
| |
| def teardown_module(): |
| ClusterUtils.cluster_destroy(FILE) |
| |
| |
| def test_scm_isolation_one_node(run_second_phase): |
| """ |
| In this test, one of the datanodes cannot communicate with SCM. |
| Other datanodes can communicate with SCM. |
| Expectation : The container should eventually have at least two closed |
| replicas. |
| """ |
| first_set = [OM[0], DATANODES[0], DATANODES[1], DATANODES[2]] |
| second_set = [OM[0], SCM[0], DATANODES[1], DATANODES[2]] |
| Blockade.blockade_create_partition(first_set, second_set) |
| Blockade.blockade_status() |
| ClusterUtils.run_freon(FILE, 1, 1, 1, 10240, "RATIS", "THREE") |
| logger.info("Waiting for %s seconds before checking container status", |
| os.environ["CONTAINER_STATUS_SLEEP"]) |
| time.sleep(int(os.environ["CONTAINER_STATUS_SLEEP"])) |
| all_datanodes_container_status = \ |
| ClusterUtils.findall_container_status(FILE, SCALE) |
| closed_container_datanodes = [x for x in all_datanodes_container_status |
| if x == 'CLOSED'] |
| assert len(closed_container_datanodes) >= 2, \ |
| "The container should have at least two closed replicas." |
| |
| if str(run_second_phase).lower() == "true": |
| ClusterUtils.cluster_setup(FILE, INCREASED_SCALE, False) |
| Blockade.blockade_status() |
| logger.info("Waiting for %s seconds before checking container status", |
| os.environ["CONTAINER_STATUS_SLEEP"]) |
| time.sleep(int(os.environ["CONTAINER_STATUS_SLEEP"])) |
| all_datanodes_container_status = \ |
| ClusterUtils.findall_container_status(FILE, INCREASED_SCALE) |
| closed_container_datanodes = [x for x in all_datanodes_container_status |
| if x == 'CLOSED'] |
| assert len(closed_container_datanodes) >= 3, \ |
| "The container should have at least three closed replicas." |
| Blockade.blockade_join() |
| Blockade.blockade_status() |
| _, output = \ |
| ClusterUtils.run_freon(FILE, 1, 1, 1, 10240, "RATIS", "THREE") |
| assert re.search("Status: Success", output) is not None |
| |
| |
| def test_scm_isolation_two_node(run_second_phase): |
| """ |
| In this test, two datanodes cannot communicate with SCM. |
| Expectation : The container should eventually have at three closed replicas |
| or, two open replicas and one quasi-closed replica. |
| """ |
| first_set = [OM[0], DATANODES[0], DATANODES[1], DATANODES[2]] |
| second_set = [OM[0], SCM[0], DATANODES[1]] |
| Blockade.blockade_create_partition(first_set, second_set) |
| Blockade.blockade_status() |
| ClusterUtils.run_freon(FILE, 1, 1, 1, 10240, "RATIS", "THREE") |
| logger.info("Waiting for %s seconds before checking container status", |
| os.environ["CONTAINER_STATUS_SLEEP"]) |
| time.sleep(int(os.environ["CONTAINER_STATUS_SLEEP"])) |
| all_datanodes_container_status = \ |
| ClusterUtils.findall_container_status(FILE, SCALE) |
| closed_container_datanodes = [x for x in all_datanodes_container_status |
| if x == 'CLOSED'] |
| qausiclosed_container_datanodes = [x for x in all_datanodes_container_status |
| if x == 'QUASI_CLOSED'] |
| count_open_container_datanodes = [x for x in all_datanodes_container_status |
| if x == 'OPEN'] |
| assert len(closed_container_datanodes) == 3 or \ |
| (len(count_open_container_datanodes) == 2 and |
| len(qausiclosed_container_datanodes) == 1), \ |
| "The container should have three closed replicas or two open " \ |
| "replicas and one quasi_closed replica." |
| |
| if str(run_second_phase).lower() == "true": |
| ClusterUtils.cluster_setup(FILE, INCREASED_SCALE, False) |
| Blockade.blockade_status() |
| logger.info("Waiting for %s seconds before checking container status", |
| os.environ["CONTAINER_STATUS_SLEEP"]) |
| time.sleep(int(os.environ["CONTAINER_STATUS_SLEEP"])) |
| all_datanodes_container_status = \ |
| ClusterUtils.findall_container_status(FILE, INCREASED_SCALE) |
| closed_container_datanodes = [x for x in all_datanodes_container_status |
| if x == 'CLOSED'] |
| qausiclosed_container_datanodes = \ |
| [x for x in all_datanodes_container_status if x == 'QUASI_CLOSED'] |
| assert len(closed_container_datanodes) >= 3 or \ |
| len(qausiclosed_container_datanodes) >= 3 |
| Blockade.blockade_join() |
| Blockade.blockade_status() |
| if len(closed_container_datanodes) < 3: |
| time.sleep(int(os.environ["CONTAINER_STATUS_SLEEP"])) |
| all_datanodes_container_status = \ |
| ClusterUtils.findall_container_status(FILE, INCREASED_SCALE) |
| closed_container_datanodes = [x for x in all_datanodes_container_status |
| if x == 'CLOSED'] |
| |
| assert len(closed_container_datanodes) >= 3 |
| _, output = \ |
| ClusterUtils.run_freon(FILE, 1, 1, 1, 10240, "RATIS", "THREE") |
| assert re.search("Status: Success", output) is not None |