This is an automated email from the ASF dual-hosted git repository.
taragolis pushed a commit to branch main
in repository https://gitbox.apache.org/repos/asf/airflow.git
The following commit(s) were added to refs/heads/main by this push:
new b1092582f3 Extend exclusions configurations in
`tests/always/test_example_dags.py` (#39468)
b1092582f3 is described below
commit b1092582f3077bf0b812569f217a229892db1454
Author: Andrey Anshin <[email protected]>
AuthorDate: Wed May 8 15:27:38 2024 +0400
Extend exclusions configurations in `tests/always/test_example_dags.py`
(#39468)
---
tests/_internals/capture_warnings.py | 7 +-
tests/always/test_example_dags.py | 141 +++++++++++++++++++++++++++++------
tests/deprecations_ignore.yml | 3 -
3 files changed, 123 insertions(+), 28 deletions(-)
diff --git a/tests/_internals/capture_warnings.py
b/tests/_internals/capture_warnings.py
index fe3b96fea2..16b220989b 100644
--- a/tests/_internals/capture_warnings.py
+++ b/tests/_internals/capture_warnings.py
@@ -60,6 +60,7 @@ class CapturedWarning:
lineno: int
when: WhenTypeDef
node_id: str | None = None
+ param_id: str | None = None
@classmethod
def from_record(
@@ -68,13 +69,17 @@ class CapturedWarning:
category = warning_message.category.__name__
if (category_module := warning_message.category.__module__) !=
"builtins":
category = f"{category_module}.{category}"
+ param_id = None
if node_id:
# Remove parametrized part from the test node
- node_id, *_ = node_id.partition("[")
+ node_id, _, param_part = node_id.partition("[")
+ if param_part:
+ param_id = param_part[:-1] or None
return cls(
category=category,
message=str(warning_message.message),
node_id=node_id,
+ param_id=param_id,
when=when,
filename=_resolve_warning_filepath(warning_message.filename,
os.fspath(root_path)),
lineno=warning_message.lineno,
diff --git a/tests/always/test_example_dags.py
b/tests/always/test_example_dags.py
index c86ff3602d..3a0d947c8a 100644
--- a/tests/always/test_example_dags.py
+++ b/tests/always/test_example_dags.py
@@ -19,9 +19,12 @@ from __future__ import annotations
import os
import sys
from glob import glob
+from importlib import metadata as importlib_metadata
from pathlib import Path
import pytest
+from packaging.specifiers import SpecifierSet
+from packaging.version import Version
from airflow.models import DagBag
from airflow.utils import yaml
@@ -29,8 +32,54 @@ from tests.test_utils.asserts import assert_queries_count
AIRFLOW_SOURCES_ROOT = Path(__file__).resolve().parents[2]
AIRFLOW_PROVIDERS_ROOT = AIRFLOW_SOURCES_ROOT / "airflow" / "providers"
+CURRENT_PYTHON_VERSION = f"{sys.version_info.major}.{sys.version_info.minor}"
+NO_DB_QUERY_EXCEPTION = ("/airflow/example_dags/example_subdag_operator.py",)
+PROVIDERS_PREFIXES = ("airflow/providers/", "tests/system/providers/")
+OPTIONAL_PROVIDERS_DEPENDENCIES: dict[str, dict[str, str | None]] = {
+ # Some certain of examples/system tests might require additional
dependencies,
+ # which are not installed into specific CI check
+ # Format of dictionary:
+ # key: prefix of the file which need to be excluded,
+ # values: dictionary with package distributions and optional specifier,
e.g. >=2.3.4
+}
+IGNORE_AIRFLOW_PROVIDER_DEPRECATION_WARNING: tuple[str, ...] = (
+ # Some certain of examples/system tests might raise
AirflowProviderDeprecationWarning.
+ # In general, it should be resolved as soon as parameter/operator
deprecated,
+ # however we might postpone change for a while, in this case we should add
it into this tuple
+ # and create the appropriate task in GitHub
+ "tests/system/providers/amazon/aws/example_ecs_fargate.py",
+ "tests/system/providers/amazon/aws/example_eks_with_nodegroups.py",
+ "tests/system/providers/amazon/aws/example_emr.py",
+ "tests/system/providers/amazon/aws/example_emr_notebook_execution.py",
+ "tests/system/providers/dbt/cloud/example_dbt_cloud.py",
+ "tests/system/providers/docker/example_docker_swarm.py",
+
"tests/system/providers/google/cloud/azure/example_azure_fileshare_to_gcs.py",
+
"tests/system/providers/google/cloud/bigquery/example_bigquery_operations.py",
+ "tests/system/providers/google/cloud/bigquery/example_bigquery_sensors.py",
+ "tests/system/providers/google/cloud/dataproc/example_dataproc_gke.py",
+ "tests/system/providers/google/cloud/gcs/example_gcs_sensor.py",
+ "tests/system/providers/google/cloud/gcs/example_gcs_to_gcs.py",
+
"tests/system/providers/google/cloud/kubernetes_engine/example_kubernetes_engine.py",
+
"tests/system/providers/google/cloud/kubernetes_engine/example_kubernetes_engine_async.py",
+
"tests/system/providers/google/cloud/kubernetes_engine/example_kubernetes_engine_job.py",
+
"tests/system/providers/google/cloud/kubernetes_engine/example_kubernetes_engine_kueue.py",
+
"tests/system/providers/google/cloud/kubernetes_engine/example_kubernetes_engine_resource.py",
+
"tests/system/providers/google/cloud/life_sciences/example_life_sciences.py",
+ "tests/system/providers/google/marketing_platform/example_analytics.py",
+ "tests/system/providers/weaviate/example_weaviate_cohere.py",
+ "tests/system/providers/weaviate/example_weaviate_openai.py",
+ "tests/system/providers/weaviate/example_weaviate_operator.py",
+ # Deprecated Operators/Hooks, which replaced by common.sql Operators/Hooks
+ "tests/system/providers/apache/drill/example_drill_dag.py",
+ "tests/system/providers/jdbc/example_jdbc_queries.py",
+ "tests/system/providers/microsoft/mssql/example_mssql.py",
+ "tests/system/providers/mysql/example_mysql.py",
+ "tests/system/providers/postgres/example_postgres.py",
+ "tests/system/providers/snowflake/example_snowflake.py",
+ "tests/system/providers/sqlite/example_sqlite.py",
+ "tests/system/providers/trino/example_trino.py",
+)
-NO_DB_QUERY_EXCEPTION = ["/airflow/example_dags/example_subdag_operator.py"]
if os.environ.get("PYDANTIC", "v2") != "v2":
pytest.skip(
@@ -38,6 +87,18 @@ if os.environ.get("PYDANTIC", "v2") != "v2":
)
+def match_optional_dependencies(distribution_name: str, specifier: str | None)
-> tuple[bool, str]:
+ try:
+ package_version =
Version(importlib_metadata.version(distribution_name))
+ except ImportError:
+ return False, f"{distribution_name!r} not installed."
+
+ if specifier and package_version not in SpecifierSet(specifier):
+ return False, f"{distribution_name!r} required {specifier}, but
installed {package_version}."
+
+ return True, ""
+
+
def get_suspended_providers_folders() -> list[str]:
"""
Returns a list of suspended providers folders that should be
@@ -61,11 +122,10 @@ def get_python_excluded_providers_folders() -> list[str]:
skipped when running tests (without any prefix - for example apache/beam,
yandex, google etc.).
"""
excluded_providers = []
- current_python_version =
f"{sys.version_info.major}.{sys.version_info.minor}"
for provider_path in AIRFLOW_PROVIDERS_ROOT.rglob("provider.yaml"):
provider_yaml = yaml.safe_load(provider_path.read_text())
excluded_python_versions =
provider_yaml.get("excluded-python-versions", [])
- if current_python_version in excluded_python_versions:
+ if CURRENT_PYTHON_VERSION in excluded_python_versions:
excluded_providers.append(
provider_path.parent.relative_to(AIRFLOW_SOURCES_ROOT)
.as_posix()
@@ -74,29 +134,62 @@ def get_python_excluded_providers_folders() -> list[str]:
return excluded_providers
-def example_not_excluded_dags():
+def example_not_excluded_dags(xfail_db_exception: bool = False):
example_dirs = ["airflow/**/example_dags/example_*.py",
"tests/system/**/example_*.py"]
- excluded_providers_folders = get_suspended_providers_folders()
- excluded_providers_folders.extend(get_python_excluded_providers_folders())
- possible_prefixes = ["airflow/providers/", "tests/system/providers/"]
+ suspended_providers_folders = get_suspended_providers_folders()
+ current_python_excluded_providers_folders =
get_python_excluded_providers_folders()
suspended_providers_folders = [
AIRFLOW_SOURCES_ROOT.joinpath(prefix, provider).as_posix()
- for prefix in possible_prefixes
- for provider in excluded_providers_folders
+ for prefix in PROVIDERS_PREFIXES
+ for provider in suspended_providers_folders
+ ]
+ current_python_excluded_providers_folders = [
+ AIRFLOW_SOURCES_ROOT.joinpath(prefix, provider).as_posix()
+ for prefix in PROVIDERS_PREFIXES
+ for provider in current_python_excluded_providers_folders
]
+ providers_folders = tuple([AIRFLOW_SOURCES_ROOT.joinpath(pp).as_posix()
for pp in PROVIDERS_PREFIXES])
+
for example_dir in example_dirs:
candidates = glob(f"{AIRFLOW_SOURCES_ROOT.as_posix()}/{example_dir}",
recursive=True)
- for candidate in candidates:
- if not candidate.startswith(tuple(suspended_providers_folders)):
- yield candidate
-
-
-def example_dags_except_db_exception():
- return [
- dag_file
- for dag_file in example_not_excluded_dags()
- if not dag_file.endswith(tuple(NO_DB_QUERY_EXCEPTION))
- ]
+ for candidate in sorted(candidates):
+ param_marks = []
+
+ if candidate.startswith(tuple(suspended_providers_folders)):
+ param_marks.append(pytest.mark.skip(reason="Suspended
provider"))
+
+ if
candidate.startswith(tuple(current_python_excluded_providers_folders)):
+ param_marks.append(
+ pytest.mark.skip(reason=f"Not supported for Python
{CURRENT_PYTHON_VERSION}")
+ )
+
+ for optional, dependencies in
OPTIONAL_PROVIDERS_DEPENDENCIES.items():
+ if candidate.endswith(optional):
+ for distribution_name, specifier in dependencies.items():
+ result, reason =
match_optional_dependencies(distribution_name, specifier)
+ if not result:
+ param_marks.append(pytest.mark.skip(reason=reason))
+
+ if xfail_db_exception and
candidate.endswith(NO_DB_QUERY_EXCEPTION):
+ # Use strict XFAIL for excluded tests. So if it is not failed,
we should remove from the list.
+ param_marks.append(pytest.mark.xfail(reason="Expected DB
call", strict=True))
+
+ if candidate.startswith(providers_folders):
+ # Do not raise error in case of
airflow.exceptions.RemovedInAirflow3Warning
+ # We do not want to force change to new syntax in providers
ASAP
+ # because we might not release Airflow which deprecate some
feature
+ # Instead of that better to analyze warning report time to
time, and manually change it
+ param_marks.append(
+
pytest.mark.filterwarnings("default::airflow.exceptions.RemovedInAirflow3Warning")
+ )
+ if
candidate.endswith(IGNORE_AIRFLOW_PROVIDER_DEPRECATION_WARNING):
+ param_marks.append(
+ pytest.mark.filterwarnings(
+
"default::airflow.exceptions.AirflowProviderDeprecationWarning"
+ )
+ )
+
+ yield pytest.param(candidate, marks=tuple(param_marks),
id=relative_path(candidate))
def relative_path(path):
@@ -104,8 +197,8 @@ def relative_path(path):
@pytest.mark.db_test
-@pytest.mark.parametrize("example", example_not_excluded_dags(),
ids=relative_path)
-def test_should_be_importable(example):
+@pytest.mark.parametrize("example", example_not_excluded_dags())
+def test_should_be_importable(example: str):
dagbag = DagBag(
dag_folder=example,
include_examples=False,
@@ -115,8 +208,8 @@ def test_should_be_importable(example):
@pytest.mark.db_test
-@pytest.mark.parametrize("example", example_dags_except_db_exception(),
ids=relative_path)
-def test_should_not_do_database_queries(example):
+@pytest.mark.parametrize("example",
example_not_excluded_dags(xfail_db_exception=True))
+def test_should_not_do_database_queries(example: str):
with assert_queries_count(0, stacklevel_from_module=example.rsplit(os.sep,
1)[-1]):
DagBag(
dag_folder=example,
diff --git a/tests/deprecations_ignore.yml b/tests/deprecations_ignore.yml
index 91c05b3bd2..ef5b7332b7 100644
--- a/tests/deprecations_ignore.yml
+++ b/tests/deprecations_ignore.yml
@@ -33,9 +33,6 @@
-
tests/always/test_connection.py::TestConnection::test_connection_get_uri_from_conn
-
tests/always/test_connection.py::TestConnection::test_connection_get_uri_from_uri
- tests/always/test_connection.py::TestConnection::test_from_json_extra
-# `test_should_be_importable` and `test_should_not_do_database_queries` should
be resolved together
-- tests/always/test_example_dags.py::test_should_be_importable
-- tests/always/test_example_dags.py::test_should_not_do_database_queries
# API