blob: a0fccb8131c4a55fcb5bcad75848e60360dcc8b3 [file] [log] [blame]
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.
"""Concurrency concepts that support efficient multi-threading."""
import os
from concurrent.futures import Executor, ThreadPoolExecutor
from pyiceberg.utils.config import Config
class ExecutorFactory:
_instance: Executor | None = None
_instance_pid: int | None = None
@staticmethod
def max_workers() -> int | None:
"""Return the max number of workers configured."""
return Config().get_int("max-workers")
@staticmethod
def get_or_create() -> Executor:
"""Return the same executor in each call."""
# ThreadPoolExecutor cannot be shared across processes. If a new pid is found it means
# there is a new process so a new executor is needed. Otherwise, the executor may be in
# an invalid state and tasks submitted will not be started.
if ExecutorFactory._instance_pid != os.getpid():
ExecutorFactory._instance_pid = os.getpid()
ExecutorFactory._instance = None
if ExecutorFactory._instance is None:
max_workers = ExecutorFactory.max_workers()
ExecutorFactory._instance = ThreadPoolExecutor(max_workers=max_workers)
return ExecutorFactory._instance