Extend exclusions configurations in `tests/always/test_example_dags.py` (#39468)
diff --git a/tests/_internals/capture_warnings.py b/tests/_internals/capture_warnings.py
index fe3b96f..16b2209 100644
--- a/tests/_internals/capture_warnings.py
+++ b/tests/_internals/capture_warnings.py
@@ -60,6 +60,7 @@
lineno: int
when: WhenTypeDef
node_id: str | None = None
+ param_id: str | None = None
@classmethod
def from_record(
@@ -68,13 +69,17 @@
category = warning_message.category.__name__
if (category_module := warning_message.category.__module__) != "builtins":
category = f"{category_module}.{category}"
+ param_id = None
if node_id:
# Remove parametrized part from the test node
- node_id, *_ = node_id.partition("[")
+ node_id, _, param_part = node_id.partition("[")
+ if param_part:
+ param_id = param_part[:-1] or None
return cls(
category=category,
message=str(warning_message.message),
node_id=node_id,
+ param_id=param_id,
when=when,
filename=_resolve_warning_filepath(warning_message.filename, os.fspath(root_path)),
lineno=warning_message.lineno,
diff --git a/tests/always/test_example_dags.py b/tests/always/test_example_dags.py
index c86ff36..3a0d947 100644
--- a/tests/always/test_example_dags.py
+++ b/tests/always/test_example_dags.py
@@ -19,9 +19,12 @@
import os
import sys
from glob import glob
+from importlib import metadata as importlib_metadata
from pathlib import Path
import pytest
+from packaging.specifiers import SpecifierSet
+from packaging.version import Version
from airflow.models import DagBag
from airflow.utils import yaml
@@ -29,8 +32,54 @@
AIRFLOW_SOURCES_ROOT = Path(__file__).resolve().parents[2]
AIRFLOW_PROVIDERS_ROOT = AIRFLOW_SOURCES_ROOT / "airflow" / "providers"
+CURRENT_PYTHON_VERSION = f"{sys.version_info.major}.{sys.version_info.minor}"
+NO_DB_QUERY_EXCEPTION = ("/airflow/example_dags/example_subdag_operator.py",)
+PROVIDERS_PREFIXES = ("airflow/providers/", "tests/system/providers/")
+OPTIONAL_PROVIDERS_DEPENDENCIES: dict[str, dict[str, str | None]] = {
+ # Certain examples/system tests might require additional dependencies
+ # which are not installed in a specific CI check.
+ # Format of the dictionary:
+ # key: suffix of the file path which needs to be excluded (matched with `str.endswith`),
+ # values: dictionary of package distribution names and an optional version specifier, e.g. >=2.3.4
+}
+IGNORE_AIRFLOW_PROVIDER_DEPRECATION_WARNING: tuple[str, ...] = (
+ # Certain examples/system tests might raise AirflowProviderDeprecationWarning.
+ # In general, this should be resolved as soon as the parameter/operator is deprecated;
+ # however, we might postpone the change for a while. In that case, add the file to this tuple
+ # and create the appropriate task in GitHub.
+ "tests/system/providers/amazon/aws/example_ecs_fargate.py",
+ "tests/system/providers/amazon/aws/example_eks_with_nodegroups.py",
+ "tests/system/providers/amazon/aws/example_emr.py",
+ "tests/system/providers/amazon/aws/example_emr_notebook_execution.py",
+ "tests/system/providers/dbt/cloud/example_dbt_cloud.py",
+ "tests/system/providers/docker/example_docker_swarm.py",
+ "tests/system/providers/google/cloud/azure/example_azure_fileshare_to_gcs.py",
+ "tests/system/providers/google/cloud/bigquery/example_bigquery_operations.py",
+ "tests/system/providers/google/cloud/bigquery/example_bigquery_sensors.py",
+ "tests/system/providers/google/cloud/dataproc/example_dataproc_gke.py",
+ "tests/system/providers/google/cloud/gcs/example_gcs_sensor.py",
+ "tests/system/providers/google/cloud/gcs/example_gcs_to_gcs.py",
+ "tests/system/providers/google/cloud/kubernetes_engine/example_kubernetes_engine.py",
+ "tests/system/providers/google/cloud/kubernetes_engine/example_kubernetes_engine_async.py",
+ "tests/system/providers/google/cloud/kubernetes_engine/example_kubernetes_engine_job.py",
+ "tests/system/providers/google/cloud/kubernetes_engine/example_kubernetes_engine_kueue.py",
+ "tests/system/providers/google/cloud/kubernetes_engine/example_kubernetes_engine_resource.py",
+ "tests/system/providers/google/cloud/life_sciences/example_life_sciences.py",
+ "tests/system/providers/google/marketing_platform/example_analytics.py",
+ "tests/system/providers/weaviate/example_weaviate_cohere.py",
+ "tests/system/providers/weaviate/example_weaviate_openai.py",
+ "tests/system/providers/weaviate/example_weaviate_operator.py",
+ # Deprecated Operators/Hooks, which are replaced by common.sql Operators/Hooks
+ "tests/system/providers/apache/drill/example_drill_dag.py",
+ "tests/system/providers/jdbc/example_jdbc_queries.py",
+ "tests/system/providers/microsoft/mssql/example_mssql.py",
+ "tests/system/providers/mysql/example_mysql.py",
+ "tests/system/providers/postgres/example_postgres.py",
+ "tests/system/providers/snowflake/example_snowflake.py",
+ "tests/system/providers/sqlite/example_sqlite.py",
+ "tests/system/providers/trino/example_trino.py",
+)
-NO_DB_QUERY_EXCEPTION = ["/airflow/example_dags/example_subdag_operator.py"]
if os.environ.get("PYDANTIC", "v2") != "v2":
pytest.skip(
@@ -38,6 +87,18 @@
)
+def match_optional_dependencies(distribution_name: str, specifier: str | None) -> tuple[bool, str]:
+ try:
+ package_version = Version(importlib_metadata.version(distribution_name))
+ except ImportError:
+ return False, f"{distribution_name!r} not installed."
+
+ if specifier and package_version not in SpecifierSet(specifier):
+ return False, f"{distribution_name!r} required {specifier}, but installed {package_version}."
+
+ return True, ""
+
+
def get_suspended_providers_folders() -> list[str]:
"""
Returns a list of suspended providers folders that should be
@@ -61,11 +122,10 @@
skipped when running tests (without any prefix - for example apache/beam, yandex, google etc.).
"""
excluded_providers = []
- current_python_version = f"{sys.version_info.major}.{sys.version_info.minor}"
for provider_path in AIRFLOW_PROVIDERS_ROOT.rglob("provider.yaml"):
provider_yaml = yaml.safe_load(provider_path.read_text())
excluded_python_versions = provider_yaml.get("excluded-python-versions", [])
- if current_python_version in excluded_python_versions:
+ if CURRENT_PYTHON_VERSION in excluded_python_versions:
excluded_providers.append(
provider_path.parent.relative_to(AIRFLOW_SOURCES_ROOT)
.as_posix()
@@ -74,29 +134,62 @@
return excluded_providers
-def example_not_excluded_dags():
+def example_not_excluded_dags(xfail_db_exception: bool = False):
example_dirs = ["airflow/**/example_dags/example_*.py", "tests/system/**/example_*.py"]
- excluded_providers_folders = get_suspended_providers_folders()
- excluded_providers_folders.extend(get_python_excluded_providers_folders())
- possible_prefixes = ["airflow/providers/", "tests/system/providers/"]
+ suspended_providers_folders = get_suspended_providers_folders()
+ current_python_excluded_providers_folders = get_python_excluded_providers_folders()
suspended_providers_folders = [
AIRFLOW_SOURCES_ROOT.joinpath(prefix, provider).as_posix()
- for prefix in possible_prefixes
- for provider in excluded_providers_folders
+ for prefix in PROVIDERS_PREFIXES
+ for provider in suspended_providers_folders
]
+ current_python_excluded_providers_folders = [
+ AIRFLOW_SOURCES_ROOT.joinpath(prefix, provider).as_posix()
+ for prefix in PROVIDERS_PREFIXES
+ for provider in current_python_excluded_providers_folders
+ ]
+ providers_folders = tuple([AIRFLOW_SOURCES_ROOT.joinpath(pp).as_posix() for pp in PROVIDERS_PREFIXES])
+
for example_dir in example_dirs:
candidates = glob(f"{AIRFLOW_SOURCES_ROOT.as_posix()}/{example_dir}", recursive=True)
- for candidate in candidates:
- if not candidate.startswith(tuple(suspended_providers_folders)):
- yield candidate
+ for candidate in sorted(candidates):
+ param_marks = []
+ if candidate.startswith(tuple(suspended_providers_folders)):
+ param_marks.append(pytest.mark.skip(reason="Suspended provider"))
-def example_dags_except_db_exception():
- return [
- dag_file
- for dag_file in example_not_excluded_dags()
- if not dag_file.endswith(tuple(NO_DB_QUERY_EXCEPTION))
- ]
+ if candidate.startswith(tuple(current_python_excluded_providers_folders)):
+ param_marks.append(
+ pytest.mark.skip(reason=f"Not supported for Python {CURRENT_PYTHON_VERSION}")
+ )
+
+ for optional, dependencies in OPTIONAL_PROVIDERS_DEPENDENCIES.items():
+ if candidate.endswith(optional):
+ for distribution_name, specifier in dependencies.items():
+ result, reason = match_optional_dependencies(distribution_name, specifier)
+ if not result:
+ param_marks.append(pytest.mark.skip(reason=reason))
+
+ if xfail_db_exception and candidate.endswith(NO_DB_QUERY_EXCEPTION):
+ # Use strict XFAIL for excluded tests, so that if a test does not fail, we know to remove it from the list.
+ param_marks.append(pytest.mark.xfail(reason="Expected DB call", strict=True))
+
+ if candidate.startswith(providers_folders):
+ # Do not raise an error in case of airflow.exceptions.RemovedInAirflow3Warning.
+ # We do not want to force providers to change to the new syntax ASAP,
+ # because the Airflow version which deprecates the feature might not be released yet.
+ # Instead, it is better to analyze the warning report from time to time and change it manually.
+ param_marks.append(
+ pytest.mark.filterwarnings("default::airflow.exceptions.RemovedInAirflow3Warning")
+ )
+ if candidate.endswith(IGNORE_AIRFLOW_PROVIDER_DEPRECATION_WARNING):
+ param_marks.append(
+ pytest.mark.filterwarnings(
+ "default::airflow.exceptions.AirflowProviderDeprecationWarning"
+ )
+ )
+
+ yield pytest.param(candidate, marks=tuple(param_marks), id=relative_path(candidate))
def relative_path(path):
@@ -104,8 +197,8 @@
@pytest.mark.db_test
-@pytest.mark.parametrize("example", example_not_excluded_dags(), ids=relative_path)
-def test_should_be_importable(example):
+@pytest.mark.parametrize("example", example_not_excluded_dags())
+def test_should_be_importable(example: str):
dagbag = DagBag(
dag_folder=example,
include_examples=False,
@@ -115,8 +208,8 @@
@pytest.mark.db_test
-@pytest.mark.parametrize("example", example_dags_except_db_exception(), ids=relative_path)
-def test_should_not_do_database_queries(example):
+@pytest.mark.parametrize("example", example_not_excluded_dags(xfail_db_exception=True))
+def test_should_not_do_database_queries(example: str):
with assert_queries_count(0, stacklevel_from_module=example.rsplit(os.sep, 1)[-1]):
DagBag(
dag_folder=example,
diff --git a/tests/deprecations_ignore.yml b/tests/deprecations_ignore.yml
index 91c05b3..ef5b733 100644
--- a/tests/deprecations_ignore.yml
+++ b/tests/deprecations_ignore.yml
@@ -33,9 +33,6 @@
- tests/always/test_connection.py::TestConnection::test_connection_get_uri_from_conn
- tests/always/test_connection.py::TestConnection::test_connection_get_uri_from_uri
- tests/always/test_connection.py::TestConnection::test_from_json_extra
-# `test_should_be_importable` and `test_should_not_do_database_queries` should be resolved together
-- tests/always/test_example_dags.py::test_should_be_importable
-- tests/always/test_example_dags.py::test_should_not_do_database_queries
# API