blob: 43e3445e4c8cee87f8f7371dc40a3175153b69e3 [file] [log] [blame]
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.
"""Module java gateway, contain gateway behavior."""
from __future__ import annotations
import contextlib
import warnings
from logging import getLogger
from typing import Any
from py4j.java_collections import JavaMap
from py4j.java_gateway import GatewayParameters, JavaGateway
from py4j.protocol import Py4JError
from pydolphinscheduler import __version__, configuration
from pydolphinscheduler.constants import JavaGatewayDefault, Version
from pydolphinscheduler.exceptions import PyDSJavaGatewayException
from pydolphinscheduler.utils.versions import version_match
logger = getLogger(__name__)
def gateway_result_checker(
result: JavaMap,
msg_check: str | None = JavaGatewayDefault.RESULT_MESSAGE_SUCCESS,
) -> Any:
"""Check weather java gateway result success or not."""
if (
result[JavaGatewayDefault.RESULT_STATUS_KEYWORD].toString()
!= JavaGatewayDefault.RESULT_STATUS_SUCCESS
):
raise PyDSJavaGatewayException("Failed when try to got result for java gateway")
if (
msg_check is not None
and result[JavaGatewayDefault.RESULT_MESSAGE_KEYWORD] != msg_check
):
raise PyDSJavaGatewayException("Get result state not success.")
return result
class GatewayEntryPoint:
"""Launch java gateway to pydolphin scheduler."""
def __init__(
self,
address: str | None = None,
port: int | None = None,
auto_convert: bool | None = True,
auth_token: str | None = None,
):
self._gateway = None
self.address = address or configuration.JAVA_GATEWAY_ADDRESS
self.port = port or configuration.JAVA_GATEWAY_PORT
self.auto_convert = auto_convert or configuration.JAVA_GATEWAY_AUTO_CONVERT
self.auth_token = auth_token or configuration.JAVA_GATEWAY_AUTH_TOKEN
gateway_version = "unknown"
with contextlib.suppress(Py4JError):
# 1. Java gateway version is too old: doesn't have method 'getGatewayVersion()'
# 2. Error connecting to Java gateway
gateway_version = self.get_gateway_version()
if (
not __version__.endswith("dev")
and gateway_version
and not version_match(Version.DS, gateway_version)
):
warnings.warn(
f"Using unmatched version of pydolphinscheduler (version {__version__}) "
f"and Java gateway (version {gateway_version}) may cause errors. "
"We strongly recommend you to find the matched version "
"(check: https://pypi.org/project/apache-dolphinscheduler)",
UserWarning,
stacklevel=2,
)
@property
def gateway(self) -> JavaGateway:
"""Launch java gateway to pydolphinscheduler.
TODO Note that automatic conversion makes calling Java methods slightly less efficient because
in the worst case, Py4J needs to go through all registered converters for all parameters.
This is why automatic conversion is disabled by default.
"""
if self._gateway is not None:
return self._gateway
configuration.token_alert(self.auth_token)
gateway_parameters = GatewayParameters(
address=self.address,
port=self.port,
auto_convert=self.auto_convert,
auth_token=self.auth_token,
)
self._gateway = JavaGateway(gateway_parameters=gateway_parameters)
return self._gateway
def get_gateway_version(self):
"""Get the java gateway version, expected to be equal with pydolphinscheduler."""
return self.gateway.entry_point.getGatewayVersion()
def get_datasource(self, name: str, type: str | None = None):
"""Get single datasource by java gateway.
Will use datasource_name to query database, and then filter by datasource_type if provided.
:param name: datasource name of the datasource to be queried
:param type: datasource type of the datasource, only used to filter the result.
"""
return self.gateway.entry_point.getDatasource(name, type)
def get_resources_file_info(self, program_type: str, main_package: str):
"""Get resources file info through java gateway."""
return self.gateway.entry_point.getResourcesFileInfo(program_type, main_package)
def create_or_update_resource(self, user_name: str, name: str, content: str):
"""Create or update resource through java gateway."""
return self.gateway.entry_point.createOrUpdateResource(user_name, name, content)
def query_resources_file_info(self, user_name: str, name: str):
"""Get resources file info through java gateway."""
return self.gateway.entry_point.queryResourcesFileInfo(user_name, name)
def query_environment_info(self, name: str):
"""Get environment info through java gateway."""
return self.gateway.entry_point.getEnvironmentInfo(name)
def get_code_and_version(
self, project_name: str, workflow_name: str, task_name: str
):
"""Get code and version through java gateway."""
return self.gateway.entry_point.getCodeAndVersion(
project_name, workflow_name, task_name
)
def create_or_grant_project(
self, user: str, name: str, description: str | None = None
):
"""Create or grant project through java gateway."""
return self.gateway.entry_point.createOrGrantProject(user, name, description)
def query_project_by_name(self, user: str, name: str):
"""Query project through java gateway."""
return self.gateway.entry_point.queryProjectByName(user, name)
def update_project(
self, user: str, project_code: int, project_name: str, description: str
):
"""Update project through java gateway."""
return self.gateway.entry_point.updateProject(
user, project_code, project_name, description
)
def delete_project(self, user: str, code: int):
"""Delete project through java gateway."""
return self.gateway.entry_point.deleteProject(user, code)
def create_tenant(
self, tenant_name: str, queue_name: str, description: str | None = None
):
"""Create tenant through java gateway."""
return self.gateway.entry_point.createTenant(
tenant_name, description, queue_name
)
def query_tenant(self, tenant_code: str):
"""Query tenant through java gateway."""
return self.gateway.entry_point.queryTenantByCode(tenant_code)
def grant_tenant_to_user(self, user_name: str, tenant_code: str):
"""Grant tenant to user through java gateway."""
return self.gateway.entry_point.grantTenantToUser(user_name, tenant_code)
def update_tenant(
self,
user: str,
tenant_id: int,
code: str,
queue_id: int,
description: str | None = None,
):
"""Update tenant through java gateway."""
return self.gateway.entry_point.updateTenant(
user, tenant_id, code, queue_id, description
)
def delete_tenant(self, user: str, tenant_id: int):
"""Delete tenant through java gateway."""
return self.gateway.entry_point.deleteTenantById(user, tenant_id)
def create_user(
self,
name: str,
password: str,
email: str,
phone: str,
tenant: str,
queue: str,
status: int,
):
"""Create user through java gateway."""
return self.gateway.entry_point.createUser(
name, password, email, phone, tenant, queue, status
)
def query_user(self, user_id: int):
"""Query user through java gateway."""
return self.gateway.queryUser(user_id)
def update_user(
self,
name: str,
password: str,
email: str,
phone: str,
tenant: str,
queue: str,
status: int,
):
"""Update user through java gateway."""
return self.gateway.entry_point.updateUser(
name, password, email, phone, tenant, queue, status
)
def delete_user(self, name: str, user_id: int):
"""Delete user through java gateway."""
return self.gateway.entry_point.deleteUser(name, user_id)
def get_dependent_info(
self,
project_name: str,
workflow_name: str,
task_name: str | None = None,
):
"""Get dependent info through java gateway."""
return self.gateway.entry_point.getDependentInfo(
project_name, workflow_name, task_name
)
def get_workflow_info(self, user_name: str, project_name: str, workflow_name: str):
"""Get workflow info through java gateway."""
return self.gateway.entry_point.getWorkflowInfo(
user_name, project_name, workflow_name
)
def create_or_update_workflow(
self,
user_name: str,
project_name: str,
name: str,
description: str,
global_params: str,
warning_type: str,
warning_group_id: int,
execution_type: str,
timeout: int,
worker_group: str,
release_state: int,
task_relation_json: str,
task_definition_json: str,
schedule: str | None = None,
online_schedule: bool | None = None,
other_params_json: str | None = None,
):
"""Create or update workflow through java gateway."""
return self.gateway.entry_point.createOrUpdateWorkflow(
user_name,
project_name,
name,
description,
global_params,
schedule,
online_schedule,
warning_type,
warning_group_id,
timeout,
worker_group,
release_state,
task_relation_json,
task_definition_json,
other_params_json,
execution_type,
)
def exec_workflow_instance(
self,
user_name: str,
project_name: str,
workflow_name: str,
cron_time: str,
worker_group: str,
warning_type: str,
warning_group_id: int,
timeout: int,
):
"""Exec workflow instance through java gateway."""
return self.gateway.entry_point.execWorkflowInstance(
user_name,
project_name,
workflow_name,
cron_time,
worker_group,
warning_type,
warning_group_id,
timeout,
)
gateway = GatewayEntryPoint()