Airflow Summit 2025 is coming October 07-09. Register now for an early-bird ticket!

Source code for tests.system.openlineage.example_openlineage_defer_simple_dag

# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements.  See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership.  The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License.  You may obtain a copy of the License at
#
#   http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied.  See the License for the
# specific language governing permissions and limitations
# under the License.
"""
Simple DAG with deferrable operator.

It checks:
    - that at least two task START events (before and after deferral) are emitted and
      the try_num remains at 1
"""

from __future__ import annotations

import warnings
from datetime import datetime, timedelta

from airflow import DAG
from airflow.exceptions import AirflowProviderDeprecationWarning
from airflow.models import Variable
from airflow.providers.standard.operators.python import PythonOperator
from airflow.providers.standard.sensors.time_delta import TimeDeltaSensorAsync

from system.openlineage.expected_events import get_expected_event_file_path
from system.openlineage.operator import OpenLineageTestOperator


def check_events_number_func():
    """
    Verify that enough START events were recorded for the ``wait`` task.

    Reads the Airflow Variable ``openlineage_defer_simple_dag.wait.event.start``
    (deserialized from JSON) and checks how many entries it holds.
    NOTE(review): presumably this Variable is populated by the OpenLineage test
    transport while the DAG runs -- confirm against the transport implementation.

    :raises ValueError: if fewer than 2 START events are stored for task ``wait``.
    """
    start_events = Variable.get(
        key="openlineage_defer_simple_dag.wait.event.start",
        deserialize_json=True,
    )
    event_count = len(start_events)
    # One START is expected before the deferral and another after the task resumes.
    if event_count >= 2:
        return
    raise ValueError(f"Expected at least 2 START events for task `wait`, got {event_count}")
DAG_ID = "openlineage_defer_simple_dag"

with DAG(
    dag_id=DAG_ID,
    schedule=None,
    catchup=False,
    start_date=datetime(2021, 1, 1),
    default_args={"retries": 0},
) as dag:
    # The sensor's timedelta is measured from the DAGRun start timestamp, and a worker may
    # pick the task up much later than that. 180s is used so that the sensor is deferred
    # at least once.
    with warnings.catch_warnings():
        # TODO Switch to TimeDeltaSensor when deferrable is released
        warnings.simplefilter("ignore", AirflowProviderDeprecationWarning)
        wait = TimeDeltaSensorAsync(task_id="wait", delta=timedelta(seconds=180))

    # Runs the START-event count check defined above.
    check_events_number = PythonOperator(
        python_callable=check_events_number_func,
        task_id="check_events_number",
    )

    # Compares emitted events with the expected-events file for this DAG; duplicates are allowed.
    check_events = OpenLineageTestOperator(
        task_id="check_events",
        allow_duplicate_events=True,
        file_path=get_expected_event_file_path(DAG_ID),
    )

    # Task order: wait -> check_events_number -> check_events
    wait >> check_events_number
    check_events_number >> check_events


from tests_common.test_utils.system_tests import get_test_run  # noqa: E402

# Needed to run the example DAG with pytest (see: tests/system/README.md#run_via_pytest)
test_run = get_test_run(dag)

Was this entry helpful?