| # |
| # Licensed to the Apache Software Foundation (ASF) under one or more |
| # contributor license agreements. See the NOTICE file distributed with |
| # this work for additional information regarding copyright ownership. |
| # The ASF licenses this file to You under the Apache License, Version 2.0 |
| # (the "License"); you may not use this file except in compliance with |
| # the License. You may obtain a copy of the License at |
| # |
| # http://www.apache.org/licenses/LICENSE-2.0 |
| # |
| # Unless required by applicable law or agreed to in writing, software |
| # distributed under the License is distributed on an "AS IS" BASIS, |
| # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. |
| # See the License for the specific language governing permissions and |
| # limitations under the License. |
| # |
| |
| """Unit tests for the processes module.""" |
| |
| # pytype: skip-file |
| |
| import atexit |
| import glob |
| import os |
| import random |
| import re |
| import shutil |
| import socketserver |
| import subprocess |
| import tempfile |
| import threading |
| import unittest |
| from unittest.mock import patch |
| |
| from apache_beam.runners.portability import job_server |
| from apache_beam.utils import subprocess_server |
| |
| |
class JavaJarServerTest(unittest.TestCase):
  """Tests for how JavaJarServer resolves, downloads and combines jars."""

  # TODO(https://github.com/grpc/grpc/issues/37710): Remove once fixed.
  @classmethod
  def setUpClass(cls):
    # Remember the caller's setting so tearDownClass can put it back.
    cls._old_fork_support = os.environ.get('GRPC_ENABLE_FORK_SUPPORT')
    os.environ['GRPC_ENABLE_FORK_SUPPORT'] = 'false'
    super().setUpClass()

  # TODO(https://github.com/grpc/grpc/issues/37710): Remove once fixed.
  @classmethod
  def tearDownClass(cls):
    # A value of None means the variable was unset before setUpClass ran.
    if cls._old_fork_support is None:
      os.environ.pop('GRPC_ENABLE_FORK_SUPPORT', None)
    else:
      os.environ['GRPC_ENABLE_FORK_SUPPORT'] = cls._old_fork_support
    super().tearDownClass()

  def _serve_one_request(self, handler_cls):
    """Starts a local TCP server that handles exactly one request.

    The server runs `handle_request` on a daemon thread. Its listening socket
    is closed by a cleanup registered on this test, so it is not leaked.

    Args:
      handler_cls: the `socketserver.BaseRequestHandler` subclass used to
        answer the single request.

    Returns:
      The localhost port the server is listening on.
    """
    port, = subprocess_server.pick_port(None)
    server = socketserver.TCPServer(('localhost', port), handler_cls)
    self.addCleanup(server.server_close)
    thread = threading.Thread(target=server.handle_request, daemon=True)
    thread.start()
    return port

  def test_gradle_jar_release(self):
    # Release (and release-candidate) versions resolve to remote repository
    # URLs rather than to local gradle build outputs.
    path_to_beam_jar = subprocess_server.JavaJarServer.path_to_beam_jar
    self.assertEqual(
        'https://repo.maven.apache.org/maven2/org/apache/beam/'
        'beam-sdks-java-fake/VERSION/beam-sdks-java-fake-VERSION.jar',
        path_to_beam_jar(':sdks:java:fake:fatJar', version='VERSION'))
    self.assertEqual(
        'https://repo.maven.apache.org/maven2/org/apache/beam/'
        'beam-sdks-java-fake/VERSION/beam-sdks-java-fake-A-VERSION.jar',
        path_to_beam_jar(
            ':sdks:java:fake:fatJar', appendix='A', version='VERSION'))
    self.assertEqual(
        'https://repo.maven.apache.org/maven2/org/apache/beam/'
        'beam-sdks-java-fake/VERSION/beam-sdks-java-fake-A-VERSION.jar',
        path_to_beam_jar(
            ':gradle:target:doesnt:matter',
            appendix='A',
            version='VERSION',
            artifact_id='beam-sdks-java-fake'))
    self.assertEqual(
        'https://repository.apache.org/content/groups/staging/org/apache/beam/'
        'beam-sdks-java-fake/2.99.9/beam-sdks-java-fake-2.99.9.jar',
        path_to_beam_jar(':sdks:java:fake:fatJar', version='2.99.9rc2'))

  def test_gradle_jar_dev(self):
    # Dev versions point at a local SNAPSHOT jar under build/libs; since that
    # jar does not exist here, the lookup must fail naming the expected path.
    def assert_jar_not_found(jar_name, **kwargs):
      expected_path = os.path.join(
          'sdks', 'java', 'fake', 'build', 'libs', jar_name)
      with self.assertRaisesRegex(Exception,
                                  re.escape(expected_path) + ' not found.'):
        subprocess_server.JavaJarServer.path_to_beam_jar(
            ':sdks:java:fake:fatJar', version='VERSION.dev', **kwargs)

    assert_jar_not_found('beam-sdks-java-fake-VERSION-SNAPSHOT.jar')
    assert_jar_not_found(
        'beam-sdks-java-fake-A-VERSION-SNAPSHOT.jar', appendix='A')
    assert_jar_not_found(
        'fake-artifact-id-A-VERSION-SNAPSHOT.jar',
        appendix='A',
        artifact_id='fake-artifact-id')

  def test_beam_services(self):
    # Inside the beam_services context the mapped target resolves to the
    # configured value.
    with subprocess_server.JavaJarServer.beam_services({':some:target': 'foo'}):
      self.assertEqual(
          'foo',
          subprocess_server.JavaJarServer.path_to_beam_jar(':some:target'))

  def test_local_jar(self):
    # The download must identify itself with the Beam Python user agent; the
    # fake server only returns the payload when it sees that header.
    class Handler(socketserver.BaseRequestHandler):
      timeout = 1

      def handle(self):
        data = self.request.recv(1024)
        # Match on the raw bytes instead of on the repr produced by str().
        if b'User-Agent: Apache Beam SDK for Python' in data:
          self.request.sendall(b'HTTP/1.1 200 OK\n\ndata')
        else:
          self.request.sendall(b'HTTP/1.1 400 BAD REQUEST\n\n')

    port = self._serve_one_request(Handler)

    with tempfile.TemporaryDirectory() as temp_dir:
      subprocess_server.JavaJarServer.local_jar(
          'http://localhost:%s/path/to/file.jar' % port, temp_dir)
      # Read as bytes so the check does not depend on the default encoding.
      with open(os.path.join(temp_dir, 'file.jar'), 'rb') as fin:
        self.assertEqual(fin.read(), b'data')

  def test_local_jar_fallback_to_google_maven_mirror(self):
    """Test that Google Maven mirror is used as fallback
    when Maven Central fails."""
    class MavenCentralHandler(socketserver.BaseRequestHandler):
      timeout = 1

      def handle(self):
        # Simulate Maven Central returning 403 Forbidden
        self.request.sendall(b'HTTP/1.1 403 Forbidden\n\n')

    # Set up Maven Central server (will return 403)
    maven_port = self._serve_one_request(MavenCentralHandler)

    # Temporarily point the Maven Central constant at our test server;
    # patch.object restores the original value even if the test fails.
    with patch.object(subprocess_server.JavaJarServer,
                      'MAVEN_CENTRAL_REPOSITORY',
                      f'http://localhost:{maven_port}/maven2'):
      with tempfile.TemporaryDirectory() as temp_dir:
        # Use a Maven Central URL that will trigger the fallback to real
        # Google mirror
        maven_url = (
            f'http://localhost:{maven_port}/maven2/org/apache/beam/'
            f'beam-sdks-java-extensions-schemaio-expansion-service/2.63.0/'
            f'beam-sdks-java-extensions-schemaio-expansion-service-2.63.0.jar')

        # This should fail on our mock Maven Central and fallback to the
        # real Google mirror
        jar_path = subprocess_server.JavaJarServer.local_jar(
            maven_url, temp_dir)

        # Verify the file was downloaded successfully (from the real Google
        # mirror)
        self.assertTrue(os.path.exists(jar_path))
        # Should have actual content
        self.assertGreater(os.path.getsize(jar_path), 0)

  @unittest.skipUnless(shutil.which('javac'), 'missing java jdk')
  def test_classpath_jar(self):
    # Neither jar runs on its own; the composite classpath jar built from
    # both of them must.
    with tempfile.TemporaryDirectory() as temp_dir:
      # Avoid having to prefix everything in our test strings. The old
      # working directory is captured before the try block so the finally
      # clause can always restore it.
      oldwd = os.getcwd()
      os.chdir(temp_dir)
      try:
        with open('Main.java', 'w') as fout:
          fout.write(
              """
public class Main {
public static void main(String[] args) { Other.greet(); }
}
""")

        with open('Other.java', 'w') as fout:
          fout.write(
              """
public class Other {
public static void greet() { System.out.println("You got me!"); }
}
""")

        os.mkdir('jars')
        # Using split just for readability/copyability.
        subprocess.check_call('javac Main.java Other.java'.split())
        subprocess.check_call('jar cfe jars/Main.jar Main Main.class'.split())
        subprocess.check_call('jar cf jars/Other.jar Other.class'.split())
        # Make sure the java and class files don't get picked up.
        for path in glob.glob('*.*'):
          os.unlink(path)

        # These should fail.
        self.assertNotEqual(
            subprocess.call('java -jar jars/Main.jar'.split()), 0)
        self.assertNotEqual(
            subprocess.call('java -jar jars/Other.jar'.split()), 0)

        os.mkdir('beam_temp')
        composite_jar = subprocess_server.JavaJarServer.make_classpath_jar(
            'jars/Main.jar', ['jars/Other.jar'], cache_dir='beam_temp')
        # This, however, should work.
        subprocess.check_call(f'java -jar {composite_jar}'.split())

      finally:
        os.chdir(oldwd)
| |
| |
class CacheTest(unittest.TestCase):
  """Tests for _SharedCache ownership and its use by SubprocessServer."""
  @staticmethod
  def with_prefix(prefix):
    """Returns `prefix` joined to a fresh random number.

    Used as the cache constructor so that every newly built object differs
    from any previously built object for the same key.
    """
    return '%s-%s' % (prefix, random.random())

  def test_memoization(self):
    cache = subprocess_server._SharedCache(self.with_prefix, lambda x: None)
    # Register before entering the try block so that the finally clause never
    # references an unbound token.
    token = cache.register()
    try:
      a = cache.get('a')
      self.assertEqual(a[0], 'a')
      self.assertEqual(cache.get('a'), a)
      b = cache.get('b')
      self.assertEqual(b[0], 'b')
      self.assertEqual(cache.get('b'), b)
    finally:
      cache.purge(token)

  def test_purged(self):
    cache = subprocess_server._SharedCache(self.with_prefix, lambda x: None)
    token = cache.register()
    try:
      a = cache.get('a')
      self.assertEqual(cache.get('a'), a)
    finally:
      cache.purge(token)

    # After the only owner was purged, the same key yields a new object.
    token = cache.register()
    try:
      new_a = cache.get('a')
      self.assertNotEqual(new_a, a)
    finally:
      cache.purge(token)

  def test_multiple_owners(self):
    cache = subprocess_server._SharedCache(self.with_prefix, lambda x: None)
    owner1 = cache.register()
    try:
      a = cache.get('a')
      self.assertEqual(cache.get('a'), a)
      # owner2 is bound before its try block; otherwise a failure above would
      # be buried under an UnboundLocalError raised by the finally clause.
      owner2 = cache.register()
      try:
        b = cache.get('b')
        self.assertEqual(cache.get('b'), b)
      finally:
        cache.purge(owner2)
      self.assertEqual(cache.get('a'), a)
      self.assertEqual(cache.get('b'), b)
    finally:
      cache.purge(owner1)

    owner3 = cache.register()
    try:
      self.assertNotEqual(cache.get('a'), a)
      self.assertNotEqual(cache.get('b'), b)
    finally:
      cache.purge(owner3)

  def test_interleaved_owners(self):
    cache = subprocess_server._SharedCache(self.with_prefix, lambda x: None)
    owner1 = cache.register()
    a = cache.get('a')
    self.assertEqual(cache.get('a'), a)

    owner2 = cache.register()
    b = cache.get('b')
    self.assertEqual(cache.get('b'), b)

    cache.purge(owner1)
    self.assertNotEqual(cache.get('a'), a)
    self.assertEqual(cache.get('b'), b)

    cache.purge(owner2)
    owner3 = cache.register()
    self.assertNotEqual(cache.get('b'), b)
    cache.purge(owner3)

  def test_destructor_exception_partial_state(self):
    # In SubprocessServer.stop_process(), we need to make sure self._owner_id
    # is always set to None if it is not already set, even if a destructor
    # exception happens during purge(owner_id).

    destructor_calls = []

    def faulty_destructor(obj):
      destructor_calls.append(obj)
      raise RuntimeError("Destructor failed")

    custom_cache = subprocess_server._SharedCache(
        lambda *args: "process_obj", faulty_destructor)

    class CustomServer(subprocess_server.SubprocessServer):
      _cache = custom_cache

      def __init__(self):
        super().__init__(lambda channel: None, ["dummy_cmd"], port=12345)

    server = CustomServer()
    server.start_process()
    owner_id = server._owner_id
    self.assertIsNotNone(owner_id)
    self.assertIn(owner_id, custom_cache._live_owners)

    # First stop attempt fails in the destructor
    with self.assertRaises(RuntimeError):
      server.stop_process()

    # Verify fixed state: owner is purged from cache set, AND self._owner_id
    # is successfully cleared to None
    self.assertNotIn(owner_id, custom_cache._live_owners)
    self.assertIsNone(server._owner_id)

    # Second stop attempt safely does nothing (no ValueError raised)
    try:
      server.stop_process()
    except ValueError:
      self.fail("ValueError should not be raised here.")

  def test_duplicate_atexit_registration_on_restart(self):
    # Make sure we don't have duplicate atexit registration when reusing a
    # StopOnExitJobServer instance.

    class DummyJobServer(job_server.JobServer):
      def start(self):
        return "localhost:8080"

      def stop(self):
        pass

    wrapper = job_server.StopOnExitJobServer(DummyJobServer())

    registered_callbacks = []

    def mock_register(cb):
      registered_callbacks.append(cb)

    def mock_unregister(cb):
      if cb in registered_callbacks:
        registered_callbacks.remove(cb)

    with patch('atexit.register', side_effect=mock_register), \
        patch('atexit.unregister', side_effect=mock_unregister, create=True):
      # First start registers stop callback
      wrapper.start()
      self.assertTrue(wrapper._started)
      self.assertEqual(len(registered_callbacks), 1)

      # Explicit stop clears _started AND unregisters the callback
      wrapper.stop()
      self.assertFalse(wrapper._started)
      self.assertEqual(len(registered_callbacks), 0)

      # Re-starting registers the callback again, leaving exactly 1 active
      # callback
      wrapper.start()
      self.assertTrue(wrapper._started)
      self.assertEqual(len(registered_callbacks), 1)

  def test_concurrent_purge_race_condition(self):
    # Concurrent threads attempting to check membership and call purge for the
    # same owner. Here we explicitly define a synchronized dict to mimic the
    # behavior of _live_owners. This dict will block two threads on
    # __contains__, allowing us to test the race condition.
    cache = subprocess_server._SharedCache(lambda x: "obj", lambda x: None)
    owner = cache.register()

    barrier = threading.Barrier(2)
    exceptions = []

    class SynchronizedDict(dict):
      def __contains__(self, item):
        res = super().__contains__(item)
        try:
          # Force both threads to align right after checking membership but
          # before removal
          barrier.wait(timeout=0.2)
        except threading.BrokenBarrierError:
          pass
        return res

    cache._live_owners = SynchronizedDict(cache._live_owners)

    def purge_worker():
      try:
        cache.purge(owner)
      except Exception as e:
        exceptions.append(e)

    t1 = threading.Thread(target=purge_worker)
    t2 = threading.Thread(target=purge_worker)

    t1.start()
    t2.start()

    t1.join()
    t2.join()

    # Both threads should succeed cleanly without raising an exception under
    # idempotent purging. Comparing against [] (rather than checking the
    # length) makes a failure report show the captured exceptions.
    self.assertEqual(exceptions, [])

  def test_stop_process_after_cache_purged(self):
    # Reproduce the ValueError when stop_process() (called by atexit)
    # runs after the cache/owner was already purged during test teardown.
    cache = subprocess_server._SharedCache(
        lambda *args: "dummy_process", lambda obj: None)

    class DummySubprocessServer(subprocess_server.SubprocessServer):
      _cache = cache

      def __init__(self):
        super().__init__(lambda channel: None, ["dummy_cmd"], port=12345)

    server = DummySubprocessServer()
    server.start_process()
    owner_id = server._owner_id

    # Simulate pipeline context exit or test teardown purging the cache
    # directly
    cache.purge(owner_id)

    # Calling stop_process() (which happens during atexit) should succeed
    # cleanly without raising ValueError.
    server.stop_process()

  def test_force_remove(self):
    destructor_calls = []

    def custom_destructor(obj):
      destructor_calls.append(obj)

    cache = subprocess_server._SharedCache(self.with_prefix, custom_destructor)

    owner1 = cache.register()
    owner2 = cache.register()

    # Get object 'a' under both active owners
    a = cache.get('a')
    self.assertEqual(a[0], 'a')
    self.assertIn(('a', ), cache._cache)

    # force_remove on a non-existent key should be a safe no-op
    cache.force_remove('non_existent')

    # Call force_remove, which should bypass the owners check and delete it
    # immediately
    cache.force_remove('a')

    # The cache entry should be gone
    self.assertNotIn(('a', ), cache._cache)

    # Destructor must be called on 'a'
    self.assertEqual(destructor_calls, [a])

    # Retrieving 'a' again under the active owners should construct a new
    # object
    new_a = cache.get('a')
    self.assertNotEqual(new_a, a)
    self.assertEqual(new_a[0], 'a')

    # Clean up
    cache.purge(owner1)
    cache.purge(owner2)

  def test_subprocess_server_start_failed_no_leak(self):
    destructor_calls = []

    def custom_destructor(obj):
      destructor_calls.append(obj)

    class DummyProcess:
      def __init__(self):
        self.args = ["dummy_cmd"]

      def poll(self):
        return 1  # Simulate that process exited/failed

    dummy_process = DummyProcess()
    cache = subprocess_server._SharedCache(
        lambda *args: (dummy_process, "localhost:12345"), custom_destructor)

    # 1. Register an independent, unrelated owner in the cache first.
    other_owner = cache.register()

    class CustomServer(subprocess_server.SubprocessServer):
      _cache = cache

      def __init__(self):
        super().__init__(lambda channel: None, ["dummy_cmd"], port=12345)

    server = CustomServer()
    # Fetch the process using other_owner, creating the cache entry and
    # registering other_owner on it.
    cache.get(tuple(server._cmd), server._port, server._logger)

    cache_key = (tuple(server._cmd), server._port, server._logger)
    self.assertIn(cache_key, cache._cache)
    self.assertEqual(cache._cache[cache_key].owners, {other_owner})

    # 2. Verify starting the server (which registers its own owner and
    # retrieves from cache) raises RuntimeError
    with self.assertRaises(RuntimeError):
      server.start()

    # 3. Verify that the destructor was called on the process, meaning no leak
    # (even though other_owner was still registered!)
    self.assertEqual(destructor_calls, [(dummy_process, "localhost:12345")])

    # 4. Verify that the server has cleaned up its owner_id
    self.assertIsNone(server._owner_id)

    # 5. Verify the cache entry has been removed completely
    self.assertNotIn(cache_key, cache._cache)

    # Clean up the other owner
    cache.purge(other_owner)

  def test_non_context_owners_do_not_share_keys(self):
    cache = subprocess_server._SharedCache(self.with_prefix, lambda x: None)
    # owner1 is a non-context owner (e.g., prism)
    owner1 = cache.register(is_context=False)
    cache.get('a', owner=owner1)

    # owner2 is another non-context owner (e.g., short-lived expansion
    # service)
    owner2 = cache.register(is_context=False)
    cache.get('b', owner=owner2)

    # Verify that owner1 does not own 'b'
    self.assertNotIn(owner1, cache._cache[('b', )].owners)

    # Verify that owner2 does not own 'a'
    self.assertNotIn(owner2, cache._cache[('a', )].owners)

    # Purging owner2 should immediately destroy/remove 'b'
    cache.purge(owner2)
    self.assertNotIn(('b', ), cache._cache)

    # 'a' is still alive because owner1 is still registered
    self.assertIn(('a', ), cache._cache)

    # Purging owner1 should destroy/remove 'a'
    cache.purge(owner1)
    self.assertNotIn(('a', ), cache._cache)

  def test_context_owner_owns_all_keys(self):
    cache = subprocess_server._SharedCache(self.with_prefix, lambda x: None)
    # owner1 is a non-context owner (e.g., prism)
    owner1 = cache.register(is_context=False)

    # owner2 is a context owner (e.g., cache_subprocesses)
    owner2 = cache.register(is_context=True)

    # owner3 is another non-context owner (e.g., short-lived service)
    owner3 = cache.register(is_context=False)

    # owner3 requests 'b'
    cache.get('b', owner=owner3)

    # owner2 (context) should own 'b'
    self.assertIn(owner2, cache._cache[('b', )].owners)

    # owner1 (non-context) should NOT own 'b'
    self.assertNotIn(owner1, cache._cache[('b', )].owners)
| |
| |
if __name__ == '__main__':
  # Run every test case in this module when the file is executed directly.
  unittest.main()