airflow prev_dagrun_dep 源码
airflow prev_dagrun_dep 代码
文件路径:/airflow/ti_deps/deps/prev_dagrun_dep.py
#
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.
from __future__ import annotations
from sqlalchemy import func
from airflow.models.taskinstance import TaskInstance as TI
from airflow.ti_deps.deps.base_ti_dep import BaseTIDep
from airflow.utils.session import provide_session
from airflow.utils.state import State
class PrevDagrunDep(BaseTIDep):
"""
Is the past dagrun in a state that allows this task instance to run, e.g. did this
task instance's task in the previous dagrun complete if we are depending on past.
"""
NAME = "Previous Dagrun State"
IGNORABLE = True
IS_TASK_DEP = True
@provide_session
def _get_dep_statuses(self, ti: TI, session, dep_context):
if dep_context.ignore_depends_on_past:
reason = "The context specified that the state of past DAGs could be ignored."
yield self._passing_status(reason=reason)
return
if not ti.task.depends_on_past:
yield self._passing_status(reason="The task did not have depends_on_past set.")
return
dr = ti.get_dagrun(session=session)
if not dr:
yield self._passing_status(reason="This task instance does not belong to a DAG.")
return
# Don't depend on the previous task instance if we are the first task.
catchup = ti.task.dag and ti.task.dag.catchup
if catchup:
last_dagrun = dr.get_previous_scheduled_dagrun(session)
else:
last_dagrun = dr.get_previous_dagrun(session=session)
# First ever run for this DAG.
if not last_dagrun:
yield self._passing_status(reason="This task instance was the first task instance for its task.")
return
# There was a DAG run, but the task wasn't active back then.
if catchup and last_dagrun.execution_date < ti.task.start_date:
yield self._passing_status(reason="This task instance was the first task instance for its task.")
return
previous_ti = last_dagrun.get_task_instance(ti.task_id, session=session)
if not previous_ti:
if ti.task.ignore_first_depends_on_past:
has_historical_ti = (
session.query(func.count(TI.dag_id))
.filter(
TI.dag_id == ti.dag_id,
TI.task_id == ti.task_id,
TI.execution_date < ti.execution_date,
)
.scalar()
> 0
)
if not has_historical_ti:
yield self._passing_status(
reason="ignore_first_depends_on_past is true for this task "
"and it is the first task instance for its task."
)
return
yield self._failing_status(
reason="depends_on_past is true for this task's DAG, but the previous "
"task instance has not run yet."
)
return
if previous_ti.state not in {State.SKIPPED, State.SUCCESS}:
yield self._failing_status(
reason=(
f"depends_on_past is true for this task, but the previous task instance {previous_ti} "
f"is in the state '{previous_ti.state}' which is not a successful state."
)
)
previous_ti.task = ti.task
if ti.task.wait_for_downstream and not previous_ti.are_dependents_done(session=session):
yield self._failing_status(
reason=(
f"The tasks downstream of the previous task instance {previous_ti} haven't completed "
f"(and wait_for_downstream is True)."
)
)
相关信息
相关文章
airflow dag_ti_slots_available_dep 源码
airflow dagrun_backfill_dep 源码
airflow exec_date_after_start_date_dep 源码
airflow mapped_task_expanded 源码
0
赞
热门推荐
-
2、 - 优质文章
-
3、 gate.io
-
8、 golang
-
9、 openharmony
-
10、 Vue中input框自动聚焦