jedcunningham commented on code in PR #44972:
URL: https://github.com/apache/airflow/pull/44972#discussion_r1889204926


##########
airflow/dag_processing/processor.py:
##########
@@ -16,610 +16,228 @@
 # under the License.
 from __future__ import annotations
 
-import importlib
-import logging
 import os
-import signal
-import threading
-import time
-import zipfile
-from collections.abc import Generator, Iterable
-from contextlib import contextmanager, redirect_stderr, redirect_stdout, suppress
-from dataclasses import dataclass
-from typing import TYPE_CHECKING
-
-from setproctitle import setproctitle
-from sqlalchemy import event
-
-from airflow import settings
+import sys
+import traceback
+from collections.abc import Generator
+from typing import TYPE_CHECKING, Annotated, Callable, Literal, Union
+
+import attrs
+import pydantic
+
 from airflow.callbacks.callback_requests import (
+    CallbackRequest,
     DagCallbackRequest,
     TaskCallbackRequest,
 )
 from airflow.configuration import conf
-from airflow.exceptions import AirflowException
-from airflow.models.dag import DAG
 from airflow.models.dagbag import DagBag
-from airflow.models.pool import Pool
-from airflow.models.serialized_dag import SerializedDagModel
-from airflow.models.taskinstance import TaskInstance, _run_finished_callback
+from airflow.sdk.execution_time.comms import GetConnection, GetVariable
+from airflow.sdk.execution_time.supervisor import WatchedSubprocess
+from airflow.serialization.serialized_objects import LazyDeserializedDAG, SerializedDAG
 from airflow.stats import Stats
-from airflow.utils import timezone
-from airflow.utils.file import iter_airflow_imports, might_contain_dag
-from airflow.utils.log.logging_mixin import LoggingMixin, StreamLogWriter, set_context
-from airflow.utils.mixins import MultiprocessingStartMethodMixin
-from airflow.utils.session import NEW_SESSION, provide_session
-from airflow.utils.state import TaskInstanceState
 
 if TYPE_CHECKING:
-    import multiprocessing
-    from datetime import datetime
-    from multiprocessing.connection import Connection as MultiprocessingConnection
-
-    from sqlalchemy.orm.session import Session
-
-    from airflow.callbacks.callback_requests import CallbackRequest
-    from airflow.models.operator import Operator
+    from airflow.typing_compat import Self
+    from airflow.utils.context import Context
+
+
+def _parse_file_entrypoint():
+    import os
+
+    import structlog
+
+    from airflow.sdk.execution_time import task_runner
+    # Parse DAG file, send JSON back up!
+
+    comms_decoder = task_runner.CommsDecoder[DagFileParseRequest, DagFileParsingResult](
+        input=sys.stdin,
+        decoder=pydantic.TypeAdapter[DagFileParseRequest](DagFileParseRequest),
+    )
+    msg = comms_decoder.get_message()
+    comms_decoder.request_socket = os.fdopen(msg.requests_fd, "wb", buffering=0)
+
+    log = structlog.get_logger(logger_name="task")
+
+    result = _parse_file(msg, log)
+    comms_decoder.send_request(log, result)
+
+
+def _parse_file(msg: DagFileParseRequest, log):

Review Comment:
   ```suggestion
   def _parse_file(msg: DagFileParseRequest, log: FilteringBoundLogger) -> DagFileParsingResult:
   ```
   
   I think it's a FilteringBoundLogger, yeah?
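
   If we adopt this, the name also has to be importable for the annotation. A minimal sketch (assuming structlog's `structlog.typing` module, kept under `TYPE_CHECKING` since it's only needed by type checkers):

   ```python
   from typing import TYPE_CHECKING

   if TYPE_CHECKING:
       # Annotation-only import; never evaluated at runtime.
       from structlog.typing import FilteringBoundLogger
   ```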



##########
airflow/dag_processing/processor.py:
##########
@@ -16,610 +16,228 @@
 # under the License.
 from __future__ import annotations
 
-import importlib
-import logging
 import os
-import signal
-import threading
-import time
-import zipfile
-from collections.abc import Generator, Iterable
-from contextlib import contextmanager, redirect_stderr, redirect_stdout, suppress
-from dataclasses import dataclass
-from typing import TYPE_CHECKING
-
-from setproctitle import setproctitle
-from sqlalchemy import event
-
-from airflow import settings
+import sys
+import traceback
+from collections.abc import Generator
+from typing import TYPE_CHECKING, Annotated, Callable, Literal, Union
+
+import attrs
+import pydantic
+
 from airflow.callbacks.callback_requests import (
+    CallbackRequest,
     DagCallbackRequest,
     TaskCallbackRequest,
 )
 from airflow.configuration import conf
-from airflow.exceptions import AirflowException
-from airflow.models.dag import DAG
 from airflow.models.dagbag import DagBag
-from airflow.models.pool import Pool
-from airflow.models.serialized_dag import SerializedDagModel
-from airflow.models.taskinstance import TaskInstance, _run_finished_callback
+from airflow.sdk.execution_time.comms import GetConnection, GetVariable
+from airflow.sdk.execution_time.supervisor import WatchedSubprocess
+from airflow.serialization.serialized_objects import LazyDeserializedDAG, SerializedDAG
 from airflow.stats import Stats
-from airflow.utils import timezone
-from airflow.utils.file import iter_airflow_imports, might_contain_dag
-from airflow.utils.log.logging_mixin import LoggingMixin, StreamLogWriter, set_context
-from airflow.utils.mixins import MultiprocessingStartMethodMixin
-from airflow.utils.session import NEW_SESSION, provide_session
-from airflow.utils.state import TaskInstanceState
 
 if TYPE_CHECKING:
-    import multiprocessing
-    from datetime import datetime
-    from multiprocessing.connection import Connection as MultiprocessingConnection
-
-    from sqlalchemy.orm.session import Session
-
-    from airflow.callbacks.callback_requests import CallbackRequest
-    from airflow.models.operator import Operator
+    from airflow.typing_compat import Self
+    from airflow.utils.context import Context
+
+
+def _parse_file_entrypoint():
+    import os
+
+    import structlog
+
+    from airflow.sdk.execution_time import task_runner
+    # Parse DAG file, send JSON back up!
+
+    comms_decoder = task_runner.CommsDecoder[DagFileParseRequest, DagFileParsingResult](
+        input=sys.stdin,
+        decoder=pydantic.TypeAdapter[DagFileParseRequest](DagFileParseRequest),
+    )
+    msg = comms_decoder.get_message()
+    comms_decoder.request_socket = os.fdopen(msg.requests_fd, "wb", buffering=0)
+
+    log = structlog.get_logger(logger_name="task")
+
+    result = _parse_file(msg, log)
+    comms_decoder.send_request(log, result)
+
+
+def _parse_file(msg: DagFileParseRequest, log):
+    # TODO: Set known_pool names on DagBag!
+    bag = DagBag(
+        dag_folder=msg.file,
+        include_examples=False,
+        safe_mode=True,
+        load_op_links=False,
+    )
+    serialized_dags, serialization_import_errors = _serialize_dags(bag, log)
+    bag.import_errors.update(serialization_import_errors)
+    dags = [LazyDeserializedDAG(data=serdag) for serdag in serialized_dags]
+    result = DagFileParsingResult(
+        fileloc=msg.file,
+        serialized_dags=dags,
+        import_errors=bag.import_errors,
+        # TODO: Make `bag.dag_warnings` not return SQLA model objects
+        warnings=[],
+    )
+
+    if msg.callback_requests:
+        _execute_callbacks(bag, msg.callback_requests, log)
+    return result
+
+
+def _serialize_dags(bag, log):
+    serialization_import_errors = {}
+    serialized_dags = []
+    for dag in bag.dags.values():
+        try:
+            serialized_dag = SerializedDAG.to_dict(dag)
+            serialized_dags.append(serialized_dag)
+        except Exception:
+            log.exception("Failed to serialize DAG: %s", dag.fileloc)
+            dagbag_import_error_traceback_depth = conf.getint(
+                "core", "dagbag_import_error_traceback_depth", fallback=None
+            )
+            serialization_import_errors[dag.fileloc] = traceback.format_exc(
+                limit=-dagbag_import_error_traceback_depth
+            )
+    return serialized_dags, serialization_import_errors
 
 
-@dataclass
-class _QueryCounter:
-    queries_number: int = 0
+def _execute_callbacks(dagbag: DagBag, callback_requests: list[CallbackRequest], log):

Review Comment:
   ```suggestion
   def _execute_callbacks(dagbag: DagBag, callback_requests: list[CallbackRequest], log) -> None:
   ```



##########
airflow/dag_processing/processor.py:
##########
@@ -16,610 +16,228 @@
 # under the License.
 from __future__ import annotations
 
-import importlib
-import logging
 import os
-import signal
-import threading
-import time
-import zipfile
-from collections.abc import Generator, Iterable
-from contextlib import contextmanager, redirect_stderr, redirect_stdout, suppress
-from dataclasses import dataclass
-from typing import TYPE_CHECKING
-
-from setproctitle import setproctitle
-from sqlalchemy import event
-
-from airflow import settings
+import sys
+import traceback
+from collections.abc import Generator
+from typing import TYPE_CHECKING, Annotated, Callable, Literal, Union
+
+import attrs
+import pydantic
+
 from airflow.callbacks.callback_requests import (
+    CallbackRequest,
     DagCallbackRequest,
     TaskCallbackRequest,
 )
 from airflow.configuration import conf
-from airflow.exceptions import AirflowException
-from airflow.models.dag import DAG
 from airflow.models.dagbag import DagBag
-from airflow.models.pool import Pool
-from airflow.models.serialized_dag import SerializedDagModel
-from airflow.models.taskinstance import TaskInstance, _run_finished_callback
+from airflow.sdk.execution_time.comms import GetConnection, GetVariable
+from airflow.sdk.execution_time.supervisor import WatchedSubprocess
+from airflow.serialization.serialized_objects import LazyDeserializedDAG, SerializedDAG
 from airflow.stats import Stats
-from airflow.utils import timezone
-from airflow.utils.file import iter_airflow_imports, might_contain_dag
-from airflow.utils.log.logging_mixin import LoggingMixin, StreamLogWriter, set_context
-from airflow.utils.mixins import MultiprocessingStartMethodMixin
-from airflow.utils.session import NEW_SESSION, provide_session
-from airflow.utils.state import TaskInstanceState
 
 if TYPE_CHECKING:
-    import multiprocessing
-    from datetime import datetime
-    from multiprocessing.connection import Connection as MultiprocessingConnection
-
-    from sqlalchemy.orm.session import Session
-
-    from airflow.callbacks.callback_requests import CallbackRequest
-    from airflow.models.operator import Operator
+    from airflow.typing_compat import Self
+    from airflow.utils.context import Context
+
+
+def _parse_file_entrypoint():
+    import os
+
+    import structlog
+
+    from airflow.sdk.execution_time import task_runner
+    # Parse DAG file, send JSON back up!
+
+    comms_decoder = task_runner.CommsDecoder[DagFileParseRequest, DagFileParsingResult](
+        input=sys.stdin,
+        decoder=pydantic.TypeAdapter[DagFileParseRequest](DagFileParseRequest),
+    )
+    msg = comms_decoder.get_message()
+    comms_decoder.request_socket = os.fdopen(msg.requests_fd, "wb", buffering=0)
+
+    log = structlog.get_logger(logger_name="task")
+
+    result = _parse_file(msg, log)
+    comms_decoder.send_request(log, result)
+
+
+def _parse_file(msg: DagFileParseRequest, log):
+    # TODO: Set known_pool names on DagBag!
+    bag = DagBag(
+        dag_folder=msg.file,
+        include_examples=False,
+        safe_mode=True,
+        load_op_links=False,
+    )
+    serialized_dags, serialization_import_errors = _serialize_dags(bag, log)
+    bag.import_errors.update(serialization_import_errors)
+    dags = [LazyDeserializedDAG(data=serdag) for serdag in serialized_dags]
+    result = DagFileParsingResult(
+        fileloc=msg.file,
+        serialized_dags=dags,
+        import_errors=bag.import_errors,
+        # TODO: Make `bag.dag_warnings` not return SQLA model objects
+        warnings=[],
+    )
+
+    if msg.callback_requests:
+        _execute_callbacks(bag, msg.callback_requests, log)
+    return result
+
+
+def _serialize_dags(bag, log):
+    serialization_import_errors = {}
+    serialized_dags = []
+    for dag in bag.dags.values():
+        try:
+            serialized_dag = SerializedDAG.to_dict(dag)
+            serialized_dags.append(serialized_dag)
+        except Exception:
+            log.exception("Failed to serialize DAG: %s", dag.fileloc)
+            dagbag_import_error_traceback_depth = conf.getint(
+                "core", "dagbag_import_error_traceback_depth", fallback=None
+            )
+            serialization_import_errors[dag.fileloc] = traceback.format_exc(
+                limit=-dagbag_import_error_traceback_depth
+            )
+    return serialized_dags, serialization_import_errors
 
 
-@dataclass
-class _QueryCounter:
-    queries_number: int = 0
+def _execute_callbacks(dagbag: DagBag, callback_requests: list[CallbackRequest], log):
+    for request in callback_requests:
+        log.debug("Processing Callback Request", request=request)
+        if isinstance(request, TaskCallbackRequest):
+            raise NotImplementedError("Haven't coded Task callback yet!")
+            # _execute_task_callbacks(dagbag, request)
+        elif isinstance(request, DagCallbackRequest):
+            _execute_dag_callbacks(dagbag, request, log)
 
-    def inc(self):
-        self.queries_number += 1
 
+def _execute_dag_callbacks(dagbag: DagBag, request: DagCallbackRequest, log):

Review Comment:
   ```suggestion
   def _execute_dag_callbacks(dagbag: DagBag, request: DagCallbackRequest, log) -> None:
   ```



##########
task_sdk/src/airflow/sdk/log.py:
##########
@@ -324,19 +324,15 @@ def configure_logging(
                 },
             },
             "loggers": {
+                # Set Airflow logging to the level requested, but most everything else at "INFO"

Review Comment:
   We should cover this change in the newsfragment too, but I love it.
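
   Rough sketch of what that could look like, e.g. a `newsfragments/44972.significant.rst` (filename and fragment type follow the usual convention here; exact wording is just a placeholder):

   ```rst
   Non-Airflow loggers are now capped at ``INFO`` by default; the configured
   logging level only applies to the ``airflow`` loggers.
   ```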



##########
airflow/serialization/serialized_objects.py:
##########
@@ -1870,3 +1871,55 @@ def _has_kubernetes() -> bool:
     except ImportError:
         HAS_KUBERNETES = False
     return HAS_KUBERNETES
+
+
+class LazyDeserializedDAG(pydantic.BaseModel):
+    """
+    Lazily build information from the serialized DAG structure.
+
+    An object that will present "enough" of the DAG like interface to update DAG db models etc, without having
+    to deserialize the full DAG and Task hierarchy.
+    """
+
+    data: dict
+
+    NULLABLE_PROPERTIES: ClassVar[set[str]] = {
+        "is_paused_upon_creation",
+        "owner",
+        "dag_display_name",
+        "description",
+        "max_active_tasks",
+        "max_active_runs",
+        "max_consecutive_failed_dag_runs",
+        "owner_links",
+    }
+
+    @property
+    def hash(self) -> str:
+        from airflow.models.serialized_dag import SerializedDagModel
+
+        return SerializedDagModel.hash(self.data)
+
+    def next_dagrun_info(self, last):
+        return None
+
+    def __getattr__(self, name: str, /) -> Any:
+        if name in self.NULLABLE_PROPERTIES:
+            return self.data["dag"].get(name)
+        try:
+            return self.data["dag"][name]
+        except KeyError:
+            raise AttributeError(f"{type(self).__name__!r} object has no attribute {name!r}") from None
+
+    @property
+    def timetable(self):
+        return decode_timetable(self.data["dag"]["timetable"])
+
+    @property
+    def has_task_concurrency_limits(self):

Review Comment:
   ```suggestion
       def has_task_concurrency_limits(self) -> bool:
   ```



##########
airflow/dag_processing/processor.py:
##########
@@ -16,610 +16,228 @@
 # under the License.
 from __future__ import annotations
 
-import importlib
-import logging
 import os
-import signal
-import threading
-import time
-import zipfile
-from collections.abc import Generator, Iterable
-from contextlib import contextmanager, redirect_stderr, redirect_stdout, suppress
-from dataclasses import dataclass
-from typing import TYPE_CHECKING
-
-from setproctitle import setproctitle
-from sqlalchemy import event
-
-from airflow import settings
+import sys
+import traceback
+from collections.abc import Generator
+from typing import TYPE_CHECKING, Annotated, Callable, Literal, Union
+
+import attrs
+import pydantic
+
 from airflow.callbacks.callback_requests import (
+    CallbackRequest,
     DagCallbackRequest,
     TaskCallbackRequest,
 )
 from airflow.configuration import conf
-from airflow.exceptions import AirflowException
-from airflow.models.dag import DAG
 from airflow.models.dagbag import DagBag
-from airflow.models.pool import Pool
-from airflow.models.serialized_dag import SerializedDagModel
-from airflow.models.taskinstance import TaskInstance, _run_finished_callback
+from airflow.sdk.execution_time.comms import GetConnection, GetVariable
+from airflow.sdk.execution_time.supervisor import WatchedSubprocess
+from airflow.serialization.serialized_objects import LazyDeserializedDAG, SerializedDAG
 from airflow.stats import Stats
-from airflow.utils import timezone
-from airflow.utils.file import iter_airflow_imports, might_contain_dag
-from airflow.utils.log.logging_mixin import LoggingMixin, StreamLogWriter, set_context
-from airflow.utils.mixins import MultiprocessingStartMethodMixin
-from airflow.utils.session import NEW_SESSION, provide_session
-from airflow.utils.state import TaskInstanceState
 
 if TYPE_CHECKING:
-    import multiprocessing
-    from datetime import datetime
-    from multiprocessing.connection import Connection as MultiprocessingConnection
-
-    from sqlalchemy.orm.session import Session
-
-    from airflow.callbacks.callback_requests import CallbackRequest
-    from airflow.models.operator import Operator
+    from airflow.typing_compat import Self
+    from airflow.utils.context import Context
+
+
+def _parse_file_entrypoint():
+    import os
+
+    import structlog
+
+    from airflow.sdk.execution_time import task_runner
+    # Parse DAG file, send JSON back up!
+
+    comms_decoder = task_runner.CommsDecoder[DagFileParseRequest, DagFileParsingResult](
+        input=sys.stdin,
+        decoder=pydantic.TypeAdapter[DagFileParseRequest](DagFileParseRequest),
+    )
+    msg = comms_decoder.get_message()
+    comms_decoder.request_socket = os.fdopen(msg.requests_fd, "wb", buffering=0)
+
+    log = structlog.get_logger(logger_name="task")
+
+    result = _parse_file(msg, log)
+    comms_decoder.send_request(log, result)
+
+
+def _parse_file(msg: DagFileParseRequest, log):
+    # TODO: Set known_pool names on DagBag!
+    bag = DagBag(
+        dag_folder=msg.file,
+        include_examples=False,
+        safe_mode=True,
+        load_op_links=False,
+    )
+    serialized_dags, serialization_import_errors = _serialize_dags(bag, log)
+    bag.import_errors.update(serialization_import_errors)
+    dags = [LazyDeserializedDAG(data=serdag) for serdag in serialized_dags]
+    result = DagFileParsingResult(
+        fileloc=msg.file,
+        serialized_dags=dags,
+        import_errors=bag.import_errors,
+        # TODO: Make `bag.dag_warnings` not return SQLA model objects
+        warnings=[],
+    )
+
+    if msg.callback_requests:
+        _execute_callbacks(bag, msg.callback_requests, log)
+    return result
+
+
+def _serialize_dags(bag, log):
+    serialization_import_errors = {}
+    serialized_dags = []
+    for dag in bag.dags.values():
+        try:
+            serialized_dag = SerializedDAG.to_dict(dag)
+            serialized_dags.append(serialized_dag)
+        except Exception:
+            log.exception("Failed to serialize DAG: %s", dag.fileloc)
+            dagbag_import_error_traceback_depth = conf.getint(
+                "core", "dagbag_import_error_traceback_depth", fallback=None
+            )
+            serialization_import_errors[dag.fileloc] = traceback.format_exc(
+                limit=-dagbag_import_error_traceback_depth
+            )
+    return serialized_dags, serialization_import_errors
 
 
-@dataclass
-class _QueryCounter:
-    queries_number: int = 0
+def _execute_callbacks(dagbag: DagBag, callback_requests: list[CallbackRequest], log):
+    for request in callback_requests:
+        log.debug("Processing Callback Request", request=request)
+        if isinstance(request, TaskCallbackRequest):
+            raise NotImplementedError("Haven't coded Task callback yet!")
+            # _execute_task_callbacks(dagbag, request)
+        elif isinstance(request, DagCallbackRequest):
+            _execute_dag_callbacks(dagbag, request, log)
 
-    def inc(self):
-        self.queries_number += 1
 
+def _execute_dag_callbacks(dagbag: DagBag, request: DagCallbackRequest, log):
+    dag = dagbag.dags[request.dag_id]
 
-@contextmanager
-def count_queries(session: Session) -> Generator[_QueryCounter, None, None]:
-    # using list allows to read the updated counter from what context manager returns
-    counter: _QueryCounter = _QueryCounter()
+    callbacks = dag.on_failure_callback if request.is_failure_callback else dag.on_success_callback
+    if not callbacks:
+        log.warning("Callback requested, but dag didn't have any", dag_id=request.dag_id)
+        return
 
-    @event.listens_for(session, "do_orm_execute")
-    def _count_db_queries(orm_execute_state):
-        nonlocal counter
-        counter.inc()
+    callbacks = callbacks if isinstance(callbacks, list) else [callbacks]
+    # TODO:We need a proper context object!
+    context: Context = {}  # type: ignore[assignment]
 
-    yield counter
-    event.remove(session, "do_orm_execute", _count_db_queries)
+    for callback in callbacks:
+        log.info(
+            "Executing on_%s dag callback",
+            "failure" if request.is_failure_callback else "success",
+            fn=callback,
+            dag_id=request.dag_id,
+        )
+        try:
+            callback(context)
+        except Exception:
+            log.exception("Callback failed", dag_id=request.dag_id)
+            Stats.incr("dag.callback_exceptions", tags={"dag_id": request.dag_id})
 
 
-class DagFileProcessorProcess(LoggingMixin, MultiprocessingStartMethodMixin):
+class DagFileParseRequest(pydantic.BaseModel):
     """
-    Runs DAG processing in a separate process using DagFileProcessor.
+    Request for DAG File Parsing.
 
-    :param file_path: a Python file containing Airflow DAG definitions
-    :param callback_requests: failure callback to execute
+    This is the request that the manager will send to the DAG parser with the dag file and
+    any other necessary metadata.
     """
 
-    # Counter that increments every time an instance of this class is created
-    class_creation_counter = 0
-
-    def __init__(
-        self,
-        file_path: str,
-        dag_directory: str,
-        callback_requests: list[CallbackRequest],
-    ):
-        super().__init__()
-        self._file_path = file_path
-        self._dag_directory = dag_directory
-        self._callback_requests = callback_requests
-
-        # The process that was launched to process the given DAG file.
-        self._process: multiprocessing.process.BaseProcess | None = None
-        # The result of DagFileProcessor.process_file(file_path).
-        self._result: tuple[int, int, int] | None = None
-        # Whether the process is done running.
-        self._done = False
-        # When the process started.
-        self._start_time: datetime | None = None
-        # This ID is used to uniquely name the process / thread that's launched
-        # by this processor instance
-        self._instance_id = DagFileProcessorProcess.class_creation_counter
-
-        self._parent_channel: MultiprocessingConnection | None = None
-        DagFileProcessorProcess.class_creation_counter += 1
-
-    @property
-    def file_path(self) -> str:
-        return self._file_path
-
-    @staticmethod
-    def _run_file_processor(
-        result_channel: MultiprocessingConnection,
-        parent_channel: MultiprocessingConnection,
-        file_path: str,
-        thread_name: str,
-        dag_directory: str,
-        callback_requests: list[CallbackRequest],
-        known_pools: set[str] | None = None,
-    ) -> None:
-        """
-        Process the given file.
-
-        :param result_channel: the connection to use for passing back the result
-        :param parent_channel: the parent end of the channel to close in the child
-        :param file_path: the file to process
-        :param thread_name: the name to use for the process that is launched
-        :param callback_requests: failure callback to execute
-        :return: the process that was launched
-        """
-        # This helper runs in the newly created process
-        log: logging.Logger = logging.getLogger("airflow.processor")
-
-        # Since we share all open FDs from the parent, we need to close the parent side of the pipe here in
-        # the child, else it won't get closed properly until we exit.
-        parent_channel.close()
-        del parent_channel
-
-        set_context(log, file_path)
-        setproctitle(f"airflow scheduler - DagFileProcessor {file_path}")
-
-        def _handle_dag_file_processing():
-            # Re-configure the ORM engine as there are issues with multiple processes
-            settings.configure_orm()
-
-            # Change the thread name to differentiate log lines. This is
-            # really a separate process, but changing the name of the
-            # process doesn't work, so changing the thread name instead.
-            threading.current_thread().name = thread_name
-
-            log.info("Started process (PID=%s) to work on %s", os.getpid(), 
file_path)
-            dag_file_processor = DagFileProcessor(dag_directory=dag_directory, 
log=log)
-            result: tuple[int, int, int] = dag_file_processor.process_file(
-                file_path=file_path,
-                callback_requests=callback_requests,
-                known_pools=known_pools,
-            )
-            result_channel.send(result)
-
-        try:
-            DAG_PROCESSOR_LOG_TARGET = conf.get_mandatory_value("logging", "DAG_PROCESSOR_LOG_TARGET")
-            if DAG_PROCESSOR_LOG_TARGET == "stdout":
-                with Stats.timer() as timer:
-                    _handle_dag_file_processing()
-            else:
-                # The following line ensures that stdout goes to the same destination as the logs. If stdout
-                # gets sent to logs and logs are sent to stdout, this leads to an infinite loop. This
-                # necessitates this conditional based on the value of DAG_PROCESSOR_LOG_TARGET.
-                with (
-                    redirect_stdout(StreamLogWriter(log, logging.INFO)),
-                    redirect_stderr(StreamLogWriter(log, logging.WARNING)),
-                    Stats.timer() as timer,
-                ):
-                    _handle_dag_file_processing()
-            log.info("Processing %s took %.3f seconds", file_path, 
timer.duration)
-        except Exception:
-            # Log exceptions through the logging framework.
-            log.exception("Got an exception! Propagating...")
-            raise
-        finally:
-            # We re-initialized the ORM within this Process above so we need to
-            # tear it down manually here
-            settings.dispose_orm()
-
-            result_channel.close()
-
-    def start(self) -> None:
-        """Launch the process and start processing the DAG."""
-        if conf.getboolean("scheduler", "parsing_pre_import_modules", fallback=True):
-            # Read the file to pre-import airflow modules used.
-            # This prevents them from being re-imported from zero in each "processing" process
-            # and saves CPU time and memory.
-            zip_file_paths = []
-            if zipfile.is_zipfile(self.file_path):
-                try:
-                    with zipfile.ZipFile(self.file_path) as z:
-                        zip_file_paths.extend(
-                            [
-                                os.path.join(self.file_path, info.filename)
-                                for info in z.infolist()
-                                if might_contain_dag(info.filename, True, z)
-                            ]
-                        )
-                except zipfile.BadZipFile as err:
-                    self.log.error("There was an err accessing %s, %s", self.file_path, err)
-            if zip_file_paths:
-                self.import_modules(zip_file_paths)
-            else:
-                self.import_modules(self.file_path)
-
-        context = self._get_multiprocessing_context()
-
-        pool_names = {p.pool for p in Pool.get_pools()}
-
-        _parent_channel, _child_channel = context.Pipe(duplex=False)
-        process = context.Process(
-            target=type(self)._run_file_processor,
-            args=(
-                _child_channel,
-                _parent_channel,
-                self.file_path,
-                f"DagFileProcessor{self._instance_id}",
-                self._dag_directory,
-                self._callback_requests,
-                pool_names,
-            ),
-            name=f"DagFileProcessor{self._instance_id}-Process",
-        )
-        self._process = process
-        self._start_time = timezone.utcnow()
-        process.start()
-
-        # Close the child side of the pipe now the subprocess has started -- otherwise this would prevent it
-        # from closing in some cases
-        _child_channel.close()
-        del _child_channel
-
-        # Don't store it on self until after we've started the child process - we don't want to keep it from
-        # getting GCd/closed
-        self._parent_channel = _parent_channel
-
-    def kill(self) -> None:
-        """Kill the process launched to process the file, and ensure 
consistent state."""
-        if self._process is None:
-            raise AirflowException("Tried to kill before starting!")
-        self._kill_process()
-
-    def terminate(self, sigkill: bool = False) -> None:
-        """
-        Terminate (and then kill) the process launched to process the file.
-
-        :param sigkill: whether to issue a SIGKILL if SIGTERM doesn't work.
-        """
-        if self._process is None or self._parent_channel is None:
-            raise AirflowException("Tried to call terminate before starting!")
-
-        self._process.terminate()
-        # Arbitrarily wait 5s for the process to die
-        with suppress(TimeoutError):
-            self._process._popen.wait(5)  # type: ignore
-        if sigkill:
-            self._kill_process()
-        self._parent_channel.close()
-
-    def _kill_process(self) -> None:
-        if self._process is None:
-            raise AirflowException("Tried to kill process before starting!")
-
-        if self._process.is_alive() and self._process.pid:
-            self.log.warning("Killing DAGFileProcessorProcess (PID=%d)", self._process.pid)
-            os.kill(self._process.pid, signal.SIGKILL)
-
-            # Reap the spawned zombie. We active wait, because in Python 3.9 `waitpid` might lead to an
-            # exception, due to change in Python standard library and possibility of race condition
-            # see https://bugs.python.org/issue42558
-            while self._process._popen.poll() is None:  # type: ignore
-                time.sleep(0.001)
-        if self._parent_channel:
-            self._parent_channel.close()
+    file: str
+    requests_fd: int
+    callback_requests: list[CallbackRequest] = pydantic.Field(default_factory=list)
+    type: Literal["DagFileParseRequest"] = "DagFileParseRequest"
 
-    @property
-    def pid(self) -> int:
-        """PID of the process launched to process the given file."""
-        if self._process is None or self._process.pid is None:
-            raise AirflowException("Tried to get PID before starting!")
-        return self._process.pid
 
-    @property
-    def exit_code(self) -> int | None:
-        """
-        After the process is finished, this can be called to get the return code.
+class DagFileParsingResult(pydantic.BaseModel):
+    """
+    Result of DAG File Parsing.
 
-        :return: the exit code of the process
-        """
-        if self._process is None:
-            raise AirflowException("Tried to get exit code before starting!")
-        if not self._done:
-            raise AirflowException("Tried to call retcode before process was 
finished!")
-        return self._process.exitcode
+    This is the result of a successful DAG parse, in this class, we gather all serialized DAGs,
+    import errors and warnings to send back to the scheduler to store in the DB.
+    """
 
-    @property
-    def done(self) -> bool:
-        """
-        Check if the process launched to process this file is done.
+    fileloc: str
+    serialized_dags: list[LazyDeserializedDAG]
+    warnings: list | None = None
+    import_errors: dict[str, str] | None = None
+    type: Literal["DagFileParsingResult"] = "DagFileParsingResult"
 
-        :return: whether the process is finished running
-        """
-        if self._process is None or self._parent_channel is None:
-            raise AirflowException("Tried to see if it's done before 
starting!")
 
-        if self._done:
-            return True
+ToParent = Annotated[
+    Union[DagFileParsingResult, GetConnection, GetVariable],
+    pydantic.Field(discriminator="type"),
+]
 
-        if self._parent_channel.poll():
-            try:
-                self._result = self._parent_channel.recv()
-                self._done = True
-                self.log.debug("Waiting for %s", self._process)
-                self._process.join()
-                self._parent_channel.close()
-                return True
-            except EOFError:
-                # If we get an EOFError, it means the child end of the pipe has been closed. This only happens
-                # in the finally block. But due to a possible race condition, the process may have not yet
-                # terminated (it could be doing cleanup/python shutdown still). So we kill it here after a
-                # "suitable" timeout.
-                self._done = True
-                # Arbitrary timeout -- error/race condition only, so this doesn't need to be tunable.
-                self._process.join(timeout=5)
-                if self._process.is_alive():
-                    # Didn't shut down cleanly - kill it
-                    self._kill_process()
-
-        if not self._process.is_alive():
-            self._done = True
-            self.log.debug("Waiting for %s", self._process)
-            self._process.join()
-            self._parent_channel.close()
-            return True
-
-        return False
 
-    @property
-    def result(self) -> tuple[int, int, int] | None:
-        """Result of running ``DagFileProcessor.process_file()``."""
-        if not self.done:
-            raise AirflowException("Tried to get the result before it's done!")
-        return self._result
-
-    @property
-    def start_time(self) -> datetime:
-        """Time when this started to process the file."""
-        if self._start_time is None:
-            raise AirflowException("Tried to get start time before it 
started!")
-        return self._start_time
-
-    @property
-    def waitable_handle(self):
-        return self._process.sentinel
-
-    def import_modules(self, file_path: str | Iterable[str]):
-        def _import_modules(filepath):
-            for module in iter_airflow_imports(filepath):
-                try:
-                    importlib.import_module(module)
-                except Exception as e:
-                    # only log as warning because an error here is not preventing anything from working, and
-                    # if it's serious, it's going to be surfaced to the user when the dag is actually parsed.
-                    self.log.warning(
-                        "Error when trying to pre-import module '%s' found in %s: %s",
-                        module,
-                        file_path,
-                        e,
-                    )
-
-        if isinstance(file_path, str):
-            _import_modules(file_path)
-        elif isinstance(file_path, Iterable):
-            for path in file_path:
-                _import_modules(path)
-
-
-class DagFileProcessor(LoggingMixin):
+@attrs.define()
+class DagFileProcessorProcess(WatchedSubprocess):
     """
-    Process a Python file containing Airflow DAGs.
-
-    This includes:
-
-    1. Execute the file and look for DAG objects in the namespace.
-    2. Execute any Callbacks if passed to DagFileProcessor.process_file
-    3. Serialize the DAGs and save it to DB (or update existing record in the DB).
-    4. Record any errors importing the file into ORM
+    Parses dags with Task SDK API.
 
-    Returns a tuple of 'number of dags found' and 'the count of import errors'
-
-    :param log: Logger to save the processing process
+    Since DAGs are written with the Task SDK, we need to parse them in a task SDK process such that
+    we can use the Task SDK definitions when serializing. This prevents potential conflicts with classes
+    in core Airflow.
     """
 
-    UNIT_TEST_MODE: bool = conf.getboolean("core", "UNIT_TEST_MODE")
-
-    def __init__(self, dag_directory: str, log: logging.Logger):
-        super().__init__()
-        self._log = log
-        self._dag_directory = dag_directory
-        self._last_num_of_db_queries = 0
+    parsing_result: DagFileParsingResult | None = None
 
     @classmethod
-    @provide_session
-    def execute_callbacks(
+    def start(  # type: ignore[override]
         cls,
-        dagbag: DagBag,
-        callback_requests: list[CallbackRequest],
-        unit_test_mode: bool,
-        session: Session = NEW_SESSION,
-    ) -> None:
-        """
-        Execute on failure callbacks.
-
-        These objects can come from SchedulerJobRunner or from DagProcessorJobRunner.
-
-        :param dagbag: Dag Bag of dags
-        :param callback_requests: failure callbacks to execute
-        :param session: DB session.
-
-        :return: number of queries executed
-        """
-        for request in callback_requests:
-            cls.logger().debug("Processing Callback Request: %s", request)
-            try:
-                if isinstance(request, TaskCallbackRequest):
-                    cls._execute_task_callbacks(dagbag, request, unit_test_mode, session=session)
-                elif isinstance(request, DagCallbackRequest):
-                    cls._execute_dag_callbacks(dagbag, request, session=session)
-            except Exception:
-                cls.logger().exception(
-                    "Error executing %s callback for file: %s",
-                    request.__class__.__name__,
-                    request.full_filepath,
-                )
-        session.flush()
-        session.commit()
+        path: str | os.PathLike[str],
+        callbacks: list[CallbackRequest],
+        target: Callable[[], None] = _parse_file_entrypoint,
+        **kwargs,
+    ) -> Self:
+        return super().start(path, callbacks, target=target, client=None, **kwargs)  # type:ignore[arg-type]
+
+    def _on_child_started(  # type: ignore[override]
+        self, callbacks: list[CallbackRequest], path: str | os.PathLike[str], child_comms_fd: int
+    ):
+        msg = DagFileParseRequest(
+            file=os.fspath(path),
+            requests_fd=child_comms_fd,
+            callback_requests=callbacks,
+        )
+        self.stdin.write(msg.model_dump_json().encode() + b"\n")
 
-    @classmethod
-    @provide_session
-    def execute_callbacks_without_dag(
-        cls, callback_requests: list[CallbackRequest], unit_test_mode: bool, session: Session = NEW_SESSION
-    ) -> None:
-        """
-        Execute what callbacks we can as "best effort" when the dag cannot be found/had parse errors.
-
-        This is so important so that tasks that failed when there is a parse
-        error don't get stuck in queued state.
-        """
-        for request in callback_requests:
-            cls.logger().debug("Processing Callback Request: %s", request)
-            if isinstance(request, TaskCallbackRequest):
-                cls._execute_task_callbacks(None, request, unit_test_mode, session)
-            else:
-                cls.logger().info(
-                    "Not executing %s callback for file %s as there was a dag 
parse error",
-                    request.__class__.__name__,
-                    request.full_filepath,
-                )
-        session.flush()
-        session.commit()
+    def handle_requests(self, log) -> Generator[None, bytes, None]:

Review Comment:
   ```suggestion
       def handle_requests(self, log: FilteringBoundLogger) -> Generator[None, bytes, None]:
   ```
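
   (Same note as on `_parse_file` above: `FilteringBoundLogger` would need a `TYPE_CHECKING` import from `structlog.typing`.)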



##########
airflow/serialization/serialized_objects.py:
##########
@@ -1870,3 +1871,55 @@ def _has_kubernetes() -> bool:
     except ImportError:
         HAS_KUBERNETES = False
     return HAS_KUBERNETES
+
+
+class LazyDeserializedDAG(pydantic.BaseModel):
+    """
+    Lazily build information from the serialized DAG structure.
+
+    An object that will present "enough" of the DAG like interface to update DAG db models etc, without having
+    to deserialize the full DAG and Task hierarchy.
+    """
+
+    data: dict
+
+    NULLABLE_PROPERTIES: ClassVar[set[str]] = {
+        "is_paused_upon_creation",
+        "owner",
+        "dag_display_name",
+        "description",
+        "max_active_tasks",
+        "max_active_runs",
+        "max_consecutive_failed_dag_runs",
+        "owner_links",
+    }
+
+    @property
+    def hash(self) -> str:
+        from airflow.models.serialized_dag import SerializedDagModel
+
+        return SerializedDagModel.hash(self.data)
+
+    def next_dagrun_info(self, last):

Review Comment:
   ```suggestion
       def next_dagrun_info(self, last) -> None:
   ```



##########
airflow/serialization/serialized_objects.py:
##########
@@ -1870,3 +1871,55 @@ def _has_kubernetes() -> bool:
     except ImportError:
         HAS_KUBERNETES = False
     return HAS_KUBERNETES
+
+
+class LazyDeserializedDAG(pydantic.BaseModel):
+    """
+    Lazily build information from the serialized DAG structure.
+
+    An object that will present "enough" of the DAG like interface to update DAG db models etc, without having
+    to deserialize the full DAG and Task hierarchy.
+    """
+
+    data: dict
+
+    NULLABLE_PROPERTIES: ClassVar[set[str]] = {
+        "is_paused_upon_creation",
+        "owner",
+        "dag_display_name",
+        "description",
+        "max_active_tasks",
+        "max_active_runs",
+        "max_consecutive_failed_dag_runs",
+        "owner_links",
+    }
+
+    @property
+    def hash(self) -> str:
+        from airflow.models.serialized_dag import SerializedDagModel
+
+        return SerializedDagModel.hash(self.data)
+
+    def next_dagrun_info(self, last):
+        return None
+
+    def __getattr__(self, name: str, /) -> Any:
+        if name in self.NULLABLE_PROPERTIES:
+            return self.data["dag"].get(name)
+        try:
+            return self.data["dag"][name]
+        except KeyError:
+            raise AttributeError(f"{type(self).__name__!r} object has no attribute {name!r}") from None
+
+    @property
+    def timetable(self):

Review Comment:
   ```suggestion
       def timetable(self) -> Timetable:
   ```
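
   `Timetable` needs a guarded import here too; a sketch, assuming the base class still lives in `airflow.timetables.base`:

   ```python
   from typing import TYPE_CHECKING

   if TYPE_CHECKING:
       # Annotation-only import for the return type above.
       from airflow.timetables.base import Timetable
   ```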



##########
airflow/dag_processing/processor.py:
##########
@@ -16,610 +16,228 @@
 # under the License.
 from __future__ import annotations
 
-import importlib
-import logging
 import os
-import signal
-import threading
-import time
-import zipfile
-from collections.abc import Generator, Iterable
-from contextlib import contextmanager, redirect_stderr, redirect_stdout, suppress
-from dataclasses import dataclass
-from typing import TYPE_CHECKING
-
-from setproctitle import setproctitle
-from sqlalchemy import event
-
-from airflow import settings
+import sys
+import traceback
+from collections.abc import Generator
+from typing import TYPE_CHECKING, Annotated, Callable, Literal, Union
+
+import attrs
+import pydantic
+
 from airflow.callbacks.callback_requests import (
+    CallbackRequest,
     DagCallbackRequest,
     TaskCallbackRequest,
 )
 from airflow.configuration import conf
-from airflow.exceptions import AirflowException
-from airflow.models.dag import DAG
 from airflow.models.dagbag import DagBag
-from airflow.models.pool import Pool
-from airflow.models.serialized_dag import SerializedDagModel
-from airflow.models.taskinstance import TaskInstance, _run_finished_callback
+from airflow.sdk.execution_time.comms import GetConnection, GetVariable
+from airflow.sdk.execution_time.supervisor import WatchedSubprocess
+from airflow.serialization.serialized_objects import LazyDeserializedDAG, SerializedDAG
 from airflow.stats import Stats
-from airflow.utils import timezone
-from airflow.utils.file import iter_airflow_imports, might_contain_dag
-from airflow.utils.log.logging_mixin import LoggingMixin, StreamLogWriter, set_context
-from airflow.utils.mixins import MultiprocessingStartMethodMixin
-from airflow.utils.session import NEW_SESSION, provide_session
-from airflow.utils.state import TaskInstanceState
 
 if TYPE_CHECKING:
-    import multiprocessing
-    from datetime import datetime
-    from multiprocessing.connection import Connection as MultiprocessingConnection
-
-    from sqlalchemy.orm.session import Session
-
-    from airflow.callbacks.callback_requests import CallbackRequest
-    from airflow.models.operator import Operator
+    from airflow.typing_compat import Self
+    from airflow.utils.context import Context
+
+
+def _parse_file_entrypoint():
+    import os
+
+    import structlog
+
+    from airflow.sdk.execution_time import task_runner
+    # Parse DAG file, send JSON back up!
+
+    comms_decoder = task_runner.CommsDecoder[DagFileParseRequest, DagFileParsingResult](
+        input=sys.stdin,
+        decoder=pydantic.TypeAdapter[DagFileParseRequest](DagFileParseRequest),
+    )
+    msg = comms_decoder.get_message()
+    comms_decoder.request_socket = os.fdopen(msg.requests_fd, "wb", buffering=0)
+
+    log = structlog.get_logger(logger_name="task")
+
+    result = _parse_file(msg, log)
+    comms_decoder.send_request(log, result)
+
+
+def _parse_file(msg: DagFileParseRequest, log):
+    # TODO: Set known_pool names on DagBag!
+    bag = DagBag(
+        dag_folder=msg.file,
+        include_examples=False,
+        safe_mode=True,
+        load_op_links=False,
+    )
+    serialized_dags, serialization_import_errors = _serialize_dags(bag, log)
+    bag.import_errors.update(serialization_import_errors)
+    dags = [LazyDeserializedDAG(data=serdag) for serdag in serialized_dags]
+    result = DagFileParsingResult(
+        fileloc=msg.file,
+        serialized_dags=dags,
+        import_errors=bag.import_errors,
+        # TODO: Make `bag.dag_warnings` not return SQLA model objects
+        warnings=[],
+    )
+
+    if msg.callback_requests:
+        _execute_callbacks(bag, msg.callback_requests, log)
+    return result
+
+
+def _serialize_dags(bag, log):

Review Comment:
   ```suggestion
   def _serialize_dags(bag: DagBag, log: FilteringBoundLogger) -> tuple[list[dict], dict[str, str]]:
   ```

   (Going by the body: `SerializedDAG.to_dict` returns plain dicts, and the errors map fileloc to a formatted traceback.)



##########
airflow/dag_processing/processor.py:
##########
@@ -16,610 +16,228 @@
 # under the License.
 from __future__ import annotations
 
-import importlib
-import logging
 import os
-import signal
-import threading
-import time
-import zipfile
-from collections.abc import Generator, Iterable
-from contextlib import contextmanager, redirect_stderr, redirect_stdout, suppress
-from dataclasses import dataclass
-from typing import TYPE_CHECKING
-
-from setproctitle import setproctitle
-from sqlalchemy import event
-
-from airflow import settings
+import sys
+import traceback
+from collections.abc import Generator
+from typing import TYPE_CHECKING, Annotated, Callable, Literal, Union
+
+import attrs
+import pydantic
+
 from airflow.callbacks.callback_requests import (
+    CallbackRequest,
     DagCallbackRequest,
     TaskCallbackRequest,
 )
 from airflow.configuration import conf
-from airflow.exceptions import AirflowException
-from airflow.models.dag import DAG
 from airflow.models.dagbag import DagBag
-from airflow.models.pool import Pool
-from airflow.models.serialized_dag import SerializedDagModel
-from airflow.models.taskinstance import TaskInstance, _run_finished_callback
+from airflow.sdk.execution_time.comms import GetConnection, GetVariable
+from airflow.sdk.execution_time.supervisor import WatchedSubprocess
+from airflow.serialization.serialized_objects import LazyDeserializedDAG, SerializedDAG
 from airflow.stats import Stats
-from airflow.utils import timezone
-from airflow.utils.file import iter_airflow_imports, might_contain_dag
-from airflow.utils.log.logging_mixin import LoggingMixin, StreamLogWriter, set_context
-from airflow.utils.mixins import MultiprocessingStartMethodMixin
-from airflow.utils.session import NEW_SESSION, provide_session
-from airflow.utils.state import TaskInstanceState
 
 if TYPE_CHECKING:
-    import multiprocessing
-    from datetime import datetime
-    from multiprocessing.connection import Connection as MultiprocessingConnection
-
-    from sqlalchemy.orm.session import Session
-
-    from airflow.callbacks.callback_requests import CallbackRequest
-    from airflow.models.operator import Operator
+    from airflow.typing_compat import Self
+    from airflow.utils.context import Context
+
+
+def _parse_file_entrypoint():
+    import os
+
+    import structlog
+
+    from airflow.sdk.execution_time import task_runner
+    # Parse DAG file, send JSON back up!
+
+    comms_decoder = task_runner.CommsDecoder[DagFileParseRequest, DagFileParsingResult](
+        input=sys.stdin,
+        decoder=pydantic.TypeAdapter[DagFileParseRequest](DagFileParseRequest),
+    )
+    msg = comms_decoder.get_message()
+    comms_decoder.request_socket = os.fdopen(msg.requests_fd, "wb", buffering=0)
+
+    log = structlog.get_logger(logger_name="task")
+
+    result = _parse_file(msg, log)
+    comms_decoder.send_request(log, result)
+
+
+def _parse_file(msg: DagFileParseRequest, log):
+    # TODO: Set known_pool names on DagBag!
+    bag = DagBag(
+        dag_folder=msg.file,
+        include_examples=False,
+        safe_mode=True,
+        load_op_links=False,
+    )
+    serialized_dags, serialization_import_errors = _serialize_dags(bag, log)
+    bag.import_errors.update(serialization_import_errors)
+    dags = [LazyDeserializedDAG(data=serdag) for serdag in serialized_dags]
+    result = DagFileParsingResult(
+        fileloc=msg.file,
+        serialized_dags=dags,
+        import_errors=bag.import_errors,
+        # TODO: Make `bag.dag_warnings` not return SQLA model objects
+        warnings=[],
+    )
+
+    if msg.callback_requests:
+        _execute_callbacks(bag, msg.callback_requests, log)
+    return result
+
+
+def _serialize_dags(bag, log):
+    serialization_import_errors = {}
+    serialized_dags = []
+    for dag in bag.dags.values():
+        try:
+            serialized_dag = SerializedDAG.to_dict(dag)
+            serialized_dags.append(serialized_dag)
+        except Exception:
+            log.exception("Failed to serialize DAG: %s", dag.fileloc)
+            dagbag_import_error_traceback_depth = conf.getint(
+                "core", "dagbag_import_error_traceback_depth", fallback=None
+            )
+            serialization_import_errors[dag.fileloc] = traceback.format_exc(
+                limit=-dagbag_import_error_traceback_depth
+            )
+    return serialized_dags, serialization_import_errors
 
 
-@dataclass
-class _QueryCounter:
-    queries_number: int = 0
+def _execute_callbacks(dagbag: DagBag, callback_requests: list[CallbackRequest], log):
+    for request in callback_requests:
+        log.debug("Processing Callback Request", request=request)
+        if isinstance(request, TaskCallbackRequest):
+            raise NotImplementedError("Haven't coded Task callback yet!")
+            # _execute_task_callbacks(dagbag, request)
+        elif isinstance(request, DagCallbackRequest):
+            _execute_dag_callbacks(dagbag, request, log)
 
-    def inc(self):
-        self.queries_number += 1
 
+def _execute_dag_callbacks(dagbag: DagBag, request: DagCallbackRequest, log):
+    dag = dagbag.dags[request.dag_id]
 
-@contextmanager
-def count_queries(session: Session) -> Generator[_QueryCounter, None, None]:
-    # using list allows to read the updated counter from what context manager returns
-    counter: _QueryCounter = _QueryCounter()
+    callbacks = dag.on_failure_callback if request.is_failure_callback else dag.on_success_callback
+    if not callbacks:
+        log.warning("Callback requested, but dag didn't have any", dag_id=request.dag_id)
+        return
 
-    @event.listens_for(session, "do_orm_execute")
-    def _count_db_queries(orm_execute_state):
-        nonlocal counter
-        counter.inc()
+    callbacks = callbacks if isinstance(callbacks, list) else [callbacks]
+    # TODO:We need a proper context object!
+    context: Context = {}  # type: ignore[assignment]
 
-    yield counter
-    event.remove(session, "do_orm_execute", _count_db_queries)
+    for callback in callbacks:
+        log.info(
+            "Executing on_%s dag callback",
+            "failure" if request.is_failure_callback else "success",
+            fn=callback,
+            dag_id=request.dag_id,
+        )
+        try:
+            callback(context)
+        except Exception:
+            log.exception("Callback failed", dag_id=request.dag_id)
+            Stats.incr("dag.callback_exceptions", tags={"dag_id": request.dag_id})
 
 
-class DagFileProcessorProcess(LoggingMixin, MultiprocessingStartMethodMixin):
+class DagFileParseRequest(pydantic.BaseModel):
     """
-    Runs DAG processing in a separate process using DagFileProcessor.
+    Request for DAG File Parsing.
 
-    :param file_path: a Python file containing Airflow DAG definitions
-    :param callback_requests: failure callback to execute
+    This is the request that the manager will send to the DAG parser with the dag file and
+    any other necessary metadata.
     """
 
-    # Counter that increments every time an instance of this class is created
-    class_creation_counter = 0
-
-    def __init__(
-        self,
-        file_path: str,
-        dag_directory: str,
-        callback_requests: list[CallbackRequest],
-    ):
-        super().__init__()
-        self._file_path = file_path
-        self._dag_directory = dag_directory
-        self._callback_requests = callback_requests
-
-        # The process that was launched to process the given DAG file.
-        self._process: multiprocessing.process.BaseProcess | None = None
-        # The result of DagFileProcessor.process_file(file_path).
-        self._result: tuple[int, int, int] | None = None
-        # Whether the process is done running.
-        self._done = False
-        # When the process started.
-        self._start_time: datetime | None = None
-        # This ID is used to uniquely name the process / thread that's launched
-        # by this processor instance
-        self._instance_id = DagFileProcessorProcess.class_creation_counter
-
-        self._parent_channel: MultiprocessingConnection | None = None
-        DagFileProcessorProcess.class_creation_counter += 1
-
-    @property
-    def file_path(self) -> str:
-        return self._file_path
-
-    @staticmethod
-    def _run_file_processor(
-        result_channel: MultiprocessingConnection,
-        parent_channel: MultiprocessingConnection,
-        file_path: str,
-        thread_name: str,
-        dag_directory: str,
-        callback_requests: list[CallbackRequest],
-        known_pools: set[str] | None = None,
-    ) -> None:
-        """
-        Process the given file.
-
-        :param result_channel: the connection to use for passing back the result
-        :param parent_channel: the parent end of the channel to close in the child
-        :param file_path: the file to process
-        :param thread_name: the name to use for the process that is launched
-        :param callback_requests: failure callback to execute
-        :return: the process that was launched
-        """
-        # This helper runs in the newly created process
-        log: logging.Logger = logging.getLogger("airflow.processor")
-
-        # Since we share all open FDs from the parent, we need to close the parent side of the pipe here in
-        # the child, else it won't get closed properly until we exit.
-        parent_channel.close()
-        del parent_channel
-
-        set_context(log, file_path)
-        setproctitle(f"airflow scheduler - DagFileProcessor {file_path}")
-
-        def _handle_dag_file_processing():
-            # Re-configure the ORM engine as there are issues with multiple processes
-            settings.configure_orm()
-
-            # Change the thread name to differentiate log lines. This is
-            # really a separate process, but changing the name of the
-            # process doesn't work, so changing the thread name instead.
-            threading.current_thread().name = thread_name
-
-            log.info("Started process (PID=%s) to work on %s", os.getpid(), 
file_path)
-            dag_file_processor = DagFileProcessor(dag_directory=dag_directory, 
log=log)
-            result: tuple[int, int, int] = dag_file_processor.process_file(
-                file_path=file_path,
-                callback_requests=callback_requests,
-                known_pools=known_pools,
-            )
-            result_channel.send(result)
-
-        try:
-            DAG_PROCESSOR_LOG_TARGET = conf.get_mandatory_value("logging", "DAG_PROCESSOR_LOG_TARGET")
-            if DAG_PROCESSOR_LOG_TARGET == "stdout":
-                with Stats.timer() as timer:
-                    _handle_dag_file_processing()
-            else:
-                # The following line ensures that stdout goes to the same destination as the logs. If stdout
-                # gets sent to logs and logs are sent to stdout, this leads to an infinite loop. This
-                # necessitates this conditional based on the value of DAG_PROCESSOR_LOG_TARGET.
-                with (
-                    redirect_stdout(StreamLogWriter(log, logging.INFO)),
-                    redirect_stderr(StreamLogWriter(log, logging.WARNING)),
-                    Stats.timer() as timer,
-                ):
-                    _handle_dag_file_processing()
-            log.info("Processing %s took %.3f seconds", file_path, 
timer.duration)
-        except Exception:
-            # Log exceptions through the logging framework.
-            log.exception("Got an exception! Propagating...")
-            raise
-        finally:
-            # We re-initialized the ORM within this Process above so we need to
-            # tear it down manually here
-            settings.dispose_orm()
-
-            result_channel.close()
-
-    def start(self) -> None:
-        """Launch the process and start processing the DAG."""
-        if conf.getboolean("scheduler", "parsing_pre_import_modules", fallback=True):
-            # Read the file to pre-import airflow modules used.
-            # This prevents them from being re-imported from zero in each "processing" process
-            # and saves CPU time and memory.
-            zip_file_paths = []
-            if zipfile.is_zipfile(self.file_path):
-                try:
-                    with zipfile.ZipFile(self.file_path) as z:
-                        zip_file_paths.extend(
-                            [
-                                os.path.join(self.file_path, info.filename)
-                                for info in z.infolist()
-                                if might_contain_dag(info.filename, True, z)
-                            ]
-                        )
-                except zipfile.BadZipFile as err:
-                    self.log.error("There was an err accessing %s, %s", self.file_path, err)
-            if zip_file_paths:
-                self.import_modules(zip_file_paths)
-            else:
-                self.import_modules(self.file_path)
-
-        context = self._get_multiprocessing_context()
-
-        pool_names = {p.pool for p in Pool.get_pools()}
-
-        _parent_channel, _child_channel = context.Pipe(duplex=False)
-        process = context.Process(
-            target=type(self)._run_file_processor,
-            args=(
-                _child_channel,
-                _parent_channel,
-                self.file_path,
-                f"DagFileProcessor{self._instance_id}",
-                self._dag_directory,
-                self._callback_requests,
-                pool_names,
-            ),
-            name=f"DagFileProcessor{self._instance_id}-Process",
-        )
-        self._process = process
-        self._start_time = timezone.utcnow()
-        process.start()
-
-        # Close the child side of the pipe now the subprocess has started -- otherwise this would prevent it
-        # from closing in some cases
-        _child_channel.close()
-        del _child_channel
-
-        # Don't store it on self until after we've started the child process - we don't want to keep it from
-        # getting GCd/closed
-        self._parent_channel = _parent_channel
-
-    def kill(self) -> None:
-        """Kill the process launched to process the file, and ensure 
consistent state."""
-        if self._process is None:
-            raise AirflowException("Tried to kill before starting!")
-        self._kill_process()
-
-    def terminate(self, sigkill: bool = False) -> None:
-        """
-        Terminate (and then kill) the process launched to process the file.
-
-        :param sigkill: whether to issue a SIGKILL if SIGTERM doesn't work.
-        """
-        if self._process is None or self._parent_channel is None:
-            raise AirflowException("Tried to call terminate before starting!")
-
-        self._process.terminate()
-        # Arbitrarily wait 5s for the process to die
-        with suppress(TimeoutError):
-            self._process._popen.wait(5)  # type: ignore
-        if sigkill:
-            self._kill_process()
-        self._parent_channel.close()
-
-    def _kill_process(self) -> None:
-        if self._process is None:
-            raise AirflowException("Tried to kill process before starting!")
-
-        if self._process.is_alive() and self._process.pid:
-            self.log.warning("Killing DAGFileProcessorProcess (PID=%d)", 
self._process.pid)
-            os.kill(self._process.pid, signal.SIGKILL)
-
-            # Reap the spawned zombie. We active wait, because in Python 3.9 `waitpid` might lead to an
-            # exception, due to change in Python standard library and possibility of race condition
-            # see https://bugs.python.org/issue42558
-            while self._process._popen.poll() is None:  # type: ignore
-                time.sleep(0.001)
-        if self._parent_channel:
-            self._parent_channel.close()
+    file: str
+    requests_fd: int
+    callback_requests: list[CallbackRequest] = pydantic.Field(default_factory=list)
+    type: Literal["DagFileParseRequest"] = "DagFileParseRequest"
 
-    @property
-    def pid(self) -> int:
-        """PID of the process launched to process the given file."""
-        if self._process is None or self._process.pid is None:
-            raise AirflowException("Tried to get PID before starting!")
-        return self._process.pid
 
-    @property
-    def exit_code(self) -> int | None:
-        """
-        After the process is finished, this can be called to get the return code.
+class DagFileParsingResult(pydantic.BaseModel):
+    """
+    Result of DAG File Parsing.
 
-        :return: the exit code of the process
-        """
-        if self._process is None:
-            raise AirflowException("Tried to get exit code before starting!")
-        if not self._done:
-            raise AirflowException("Tried to call retcode before process was 
finished!")
-        return self._process.exitcode
+    This is the result of a successful DAG parse. In this class, we gather all serialized DAGs,
+    import errors, and warnings to send back to the scheduler to store in the DB.
+    """
 
-    @property
-    def done(self) -> bool:
-        """
-        Check if the process launched to process this file is done.
+    fileloc: str
+    serialized_dags: list[LazyDeserializedDAG]
+    warnings: list | None = None
+    import_errors: dict[str, str] | None = None
+    type: Literal["DagFileParsingResult"] = "DagFileParsingResult"
 
-        :return: whether the process is finished running
-        """
-        if self._process is None or self._parent_channel is None:
-            raise AirflowException("Tried to see if it's done before 
starting!")
 
-        if self._done:
-            return True
+ToParent = Annotated[
+    Union[DagFileParsingResult, GetConnection, GetVariable],
+    pydantic.Field(discriminator="type"),
+]
 
-        if self._parent_channel.poll():
-            try:
-                self._result = self._parent_channel.recv()
-                self._done = True
-                self.log.debug("Waiting for %s", self._process)
-                self._process.join()
-                self._parent_channel.close()
-                return True
-            except EOFError:
-                # If we get an EOFError, it means the child end of the pipe has been closed. This only happens
-                # in the finally block. But due to a possible race condition, the process may have not yet
-                # terminated (it could be doing cleanup/python shutdown still). So we kill it here after a
-                # "suitable" timeout.
-                self._done = True
-                # Arbitrary timeout -- error/race condition only, so this doesn't need to be tunable.
-                self._process.join(timeout=5)
-                if self._process.is_alive():
-                    # Didn't shut down cleanly - kill it
-                    self._kill_process()
-
-        if not self._process.is_alive():
-            self._done = True
-            self.log.debug("Waiting for %s", self._process)
-            self._process.join()
-            self._parent_channel.close()
-            return True
-
-        return False
 
-    @property
-    def result(self) -> tuple[int, int, int] | None:
-        """Result of running ``DagFileProcessor.process_file()``."""
-        if not self.done:
-            raise AirflowException("Tried to get the result before it's done!")
-        return self._result
-
-    @property
-    def start_time(self) -> datetime:
-        """Time when this started to process the file."""
-        if self._start_time is None:
-            raise AirflowException("Tried to get start time before it 
started!")
-        return self._start_time
-
-    @property
-    def waitable_handle(self):
-        return self._process.sentinel
-
-    def import_modules(self, file_path: str | Iterable[str]):
-        def _import_modules(filepath):
-            for module in iter_airflow_imports(filepath):
-                try:
-                    importlib.import_module(module)
-                except Exception as e:
-                    # only log as warning because an error here is not preventing anything from working, and
-                    # if it's serious, it's going to be surfaced to the user when the dag is actually parsed.
-                    self.log.warning(
-                        "Error when trying to pre-import module '%s' found in 
%s: %s",
-                        module,
-                        file_path,
-                        e,
-                    )
-
-        if isinstance(file_path, str):
-            _import_modules(file_path)
-        elif isinstance(file_path, Iterable):
-            for path in file_path:
-                _import_modules(path)
-
-
-class DagFileProcessor(LoggingMixin):
[email protected]()
+class DagFileProcessorProcess(WatchedSubprocess):
     """
-    Process a Python file containing Airflow DAGs.
-
-    This includes:
-
-    1. Execute the file and look for DAG objects in the namespace.
-    2. Execute any Callbacks if passed to DagFileProcessor.process_file
-    3. Serialize the DAGs and save it to DB (or update existing record in the DB).
-    4. Record any errors importing the file into ORM
+    Parses DAGs with the Task SDK API.
 
-    Returns a tuple of 'number of dags found' and 'the count of import errors'
-
-    :param log: Logger to save the processing process
+    Since DAGs are written with the Task SDK, we need to parse them in a Task SDK process such that
+    we can use the Task SDK definitions when serializing. This prevents potential conflicts with classes
+    in core Airflow.
     """
 
-    UNIT_TEST_MODE: bool = conf.getboolean("core", "UNIT_TEST_MODE")
-
-    def __init__(self, dag_directory: str, log: logging.Logger):
-        super().__init__()
-        self._log = log
-        self._dag_directory = dag_directory
-        self._last_num_of_db_queries = 0
+    parsing_result: DagFileParsingResult | None = None
 
     @classmethod
-    @provide_session
-    def execute_callbacks(
+    def start(  # type: ignore[override]
         cls,
-        dagbag: DagBag,
-        callback_requests: list[CallbackRequest],
-        unit_test_mode: bool,
-        session: Session = NEW_SESSION,
-    ) -> None:
-        """
-        Execute on failure callbacks.
-
-        These objects can come from SchedulerJobRunner or from DagProcessorJobRunner.
-
-        :param dagbag: Dag Bag of dags
-        :param callback_requests: failure callbacks to execute
-        :param session: DB session.
-
-        :return: number of queries executed
-        """
-        for request in callback_requests:
-            cls.logger().debug("Processing Callback Request: %s", request)
-            try:
-                if isinstance(request, TaskCallbackRequest):
-                    cls._execute_task_callbacks(dagbag, request, unit_test_mode, session=session)
-                elif isinstance(request, DagCallbackRequest):
-                    cls._execute_dag_callbacks(dagbag, request, session=session)
-            except Exception:
-                cls.logger().exception(
-                    "Error executing %s callback for file: %s",
-                    request.__class__.__name__,
-                    request.full_filepath,
-                )
-        session.flush()
-        session.commit()
+        path: str | os.PathLike[str],
+        callbacks: list[CallbackRequest],
+        target: Callable[[], None] = _parse_file_entrypoint,
+        **kwargs,
+    ) -> Self:
+        return super().start(path, callbacks, target=target, client=None, **kwargs)  # type:ignore[arg-type]
+
+    def _on_child_started(  # type: ignore[override]
+        self, callbacks: list[CallbackRequest], path: str | os.PathLike[str], child_comms_fd: int
+    ):

Review Comment:
   ```suggestion
       ) -> None:
   ```
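   
   Annotating the return type also keeps the override's signature complete for mypy. A toy sketch, not the Airflow code, assuming the repo runs mypy with `--disallow-incomplete-defs` or a similar strictness level:
   
   ```python
   # Hypothetical illustration: with --disallow-incomplete-defs, a def whose
   # parameters are annotated but whose return type is not gets flagged.
   def incomplete(child_comms_fd: int):  # error: missing return type annotation
       print("comms fd:", child_comms_fd)
   
   
   def complete(child_comms_fd: int) -> None:  # ok: signature is fully annotated
       print("comms fd:", child_comms_fd)
   ```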



##########
airflow/dag_processing/processor.py:
##########
@@ -16,610 +16,228 @@
 # under the License.
 from __future__ import annotations
 
-import importlib
-import logging
 import os
-import signal
-import threading
-import time
-import zipfile
-from collections.abc import Generator, Iterable
-from contextlib import contextmanager, redirect_stderr, redirect_stdout, suppress
-from dataclasses import dataclass
-from typing import TYPE_CHECKING
-
-from setproctitle import setproctitle
-from sqlalchemy import event
-
-from airflow import settings
+import sys
+import traceback
+from collections.abc import Generator
+from typing import TYPE_CHECKING, Annotated, Callable, Literal, Union
+
+import attrs
+import pydantic
+
 from airflow.callbacks.callback_requests import (
+    CallbackRequest,
     DagCallbackRequest,
     TaskCallbackRequest,
 )
 from airflow.configuration import conf
-from airflow.exceptions import AirflowException
-from airflow.models.dag import DAG
 from airflow.models.dagbag import DagBag
-from airflow.models.pool import Pool
-from airflow.models.serialized_dag import SerializedDagModel
-from airflow.models.taskinstance import TaskInstance, _run_finished_callback
+from airflow.sdk.execution_time.comms import GetConnection, GetVariable
+from airflow.sdk.execution_time.supervisor import WatchedSubprocess
+from airflow.serialization.serialized_objects import LazyDeserializedDAG, SerializedDAG
 from airflow.stats import Stats
-from airflow.utils import timezone
-from airflow.utils.file import iter_airflow_imports, might_contain_dag
-from airflow.utils.log.logging_mixin import LoggingMixin, StreamLogWriter, set_context
-from airflow.utils.mixins import MultiprocessingStartMethodMixin
-from airflow.utils.session import NEW_SESSION, provide_session
-from airflow.utils.state import TaskInstanceState
 
 if TYPE_CHECKING:
-    import multiprocessing
-    from datetime import datetime
-    from multiprocessing.connection import Connection as MultiprocessingConnection
-
-    from sqlalchemy.orm.session import Session
-
-    from airflow.callbacks.callback_requests import CallbackRequest
-    from airflow.models.operator import Operator
+    from airflow.typing_compat import Self
+    from airflow.utils.context import Context
+
+
+def _parse_file_entrypoint():
+    import os
+
+    import structlog
+
+    from airflow.sdk.execution_time import task_runner
+    # Parse DAG file, send JSON back up!
+
+    comms_decoder = task_runner.CommsDecoder[DagFileParseRequest, DagFileParsingResult](
+        input=sys.stdin,
+        decoder=pydantic.TypeAdapter[DagFileParseRequest](DagFileParseRequest),
+    )
+    msg = comms_decoder.get_message()
+    comms_decoder.request_socket = os.fdopen(msg.requests_fd, "wb", buffering=0)
+
+    log = structlog.get_logger(logger_name="task")
+
+    result = _parse_file(msg, log)
+    comms_decoder.send_request(log, result)
+
+
+def _parse_file(msg: DagFileParseRequest, log):
+    # TODO: Set known_pool names on DagBag!
+    bag = DagBag(
+        dag_folder=msg.file,
+        include_examples=False,
+        safe_mode=True,
+        load_op_links=False,
+    )
+    serialized_dags, serialization_import_errors = _serialize_dags(bag, log)
+    bag.import_errors.update(serialization_import_errors)
+    dags = [LazyDeserializedDAG(data=serdag) for serdag in serialized_dags]
+    result = DagFileParsingResult(
+        fileloc=msg.file,
+        serialized_dags=dags,
+        import_errors=bag.import_errors,
+        # TODO: Make `bag.dag_warnings` not return SQLA model objects
+        warnings=[],
+    )
+
+    if msg.callback_requests:
+        _execute_callbacks(bag, msg.callback_requests, log)
+    return result
+
+
+def _serialize_dags(bag, log):
+    serialization_import_errors = {}
+    serialized_dags = []
+    for dag in bag.dags.values():
+        try:
+            serialized_dag = SerializedDAG.to_dict(dag)
+            serialized_dags.append(serialized_dag)
+        except Exception:
+            log.exception("Failed to serialize DAG: %s", dag.fileloc)
+            dagbag_import_error_traceback_depth = conf.getint(
+                "core", "dagbag_import_error_traceback_depth", fallback=None
+            )
+            serialization_import_errors[dag.fileloc] = traceback.format_exc(
+                limit=-dagbag_import_error_traceback_depth
+            )
+    return serialized_dags, serialization_import_errors
 
 
-@dataclass
-class _QueryCounter:
-    queries_number: int = 0
+def _execute_callbacks(dagbag: DagBag, callback_requests: list[CallbackRequest], log):
+    for request in callback_requests:
+        log.debug("Processing Callback Request", request=request)
+        if isinstance(request, TaskCallbackRequest):
+            raise NotImplementedError("Haven't coded Task callback yet!")
+            # _execute_task_callbacks(dagbag, request)
+        elif isinstance(request, DagCallbackRequest):
+            _execute_dag_callbacks(dagbag, request, log)
 
-    def inc(self):
-        self.queries_number += 1
 
+def _execute_dag_callbacks(dagbag: DagBag, request: DagCallbackRequest, log):
+    dag = dagbag.dags[request.dag_id]
 
-@contextmanager
-def count_queries(session: Session) -> Generator[_QueryCounter, None, None]:
-    # using list allows to read the updated counter from what context manager returns
-    counter: _QueryCounter = _QueryCounter()
+    callbacks = dag.on_failure_callback if request.is_failure_callback else dag.on_success_callback
+    if not callbacks:
+        log.warning("Callback requested, but dag didn't have any", 
dag_id=request.dag_id)
+        return
 
-    @event.listens_for(session, "do_orm_execute")
-    def _count_db_queries(orm_execute_state):
-        nonlocal counter
-        counter.inc()
+    callbacks = callbacks if isinstance(callbacks, list) else [callbacks]
+    # TODO: We need a proper context object!
+    context: Context = {}  # type: ignore[assignment]
 
-    yield counter
-    event.remove(session, "do_orm_execute", _count_db_queries)
+    for callback in callbacks:
+        log.info(
+            "Executing on_%s dag callback",
+            "failure" if request.is_failure_callback else "success",
+            fn=callback,
+            dag_id=request.dag_id,
+        )
+        try:
+            callback(context)
+        except Exception:
+            log.exception("Callback failed", dag_id=request.dag_id)
+            Stats.incr("dag.callback_exceptions", tags={"dag_id": request.dag_id})
 
 
-class DagFileProcessorProcess(LoggingMixin, MultiprocessingStartMethodMixin):
+class DagFileParseRequest(pydantic.BaseModel):
     """
-    Runs DAG processing in a separate process using DagFileProcessor.
+    Request for DAG File Parsing.
 
-    :param file_path: a Python file containing Airflow DAG definitions
-    :param callback_requests: failure callback to execute
+    This is the request that the manager will send to the DAG parser with the dag file and
+    any other necessary metadata.
     """
 
-    # Counter that increments every time an instance of this class is created
-    class_creation_counter = 0
-
-    def __init__(
-        self,
-        file_path: str,
-        dag_directory: str,
-        callback_requests: list[CallbackRequest],
-    ):
-        super().__init__()
-        self._file_path = file_path
-        self._dag_directory = dag_directory
-        self._callback_requests = callback_requests
-
-        # The process that was launched to process the given DAG file.
-        self._process: multiprocessing.process.BaseProcess | None = None
-        # The result of DagFileProcessor.process_file(file_path).
-        self._result: tuple[int, int, int] | None = None
-        # Whether the process is done running.
-        self._done = False
-        # When the process started.
-        self._start_time: datetime | None = None
-        # This ID is used to uniquely name the process / thread that's launched
-        # by this processor instance
-        self._instance_id = DagFileProcessorProcess.class_creation_counter
-
-        self._parent_channel: MultiprocessingConnection | None = None
-        DagFileProcessorProcess.class_creation_counter += 1
-
-    @property
-    def file_path(self) -> str:
-        return self._file_path
-
-    @staticmethod
-    def _run_file_processor(
-        result_channel: MultiprocessingConnection,
-        parent_channel: MultiprocessingConnection,
-        file_path: str,
-        thread_name: str,
-        dag_directory: str,
-        callback_requests: list[CallbackRequest],
-        known_pools: set[str] | None = None,
-    ) -> None:
-        """
-        Process the given file.
-
-        :param result_channel: the connection to use for passing back the result
-        :param parent_channel: the parent end of the channel to close in the child
-        :param file_path: the file to process
-        :param thread_name: the name to use for the process that is launched
-        :param callback_requests: failure callback to execute
-        :return: the process that was launched
-        """
-        # This helper runs in the newly created process
-        log: logging.Logger = logging.getLogger("airflow.processor")
-
-        # Since we share all open FDs from the parent, we need to close the parent side of the pipe here in
-        # the child, else it won't get closed properly until we exit.
-        parent_channel.close()
-        del parent_channel
-
-        set_context(log, file_path)
-        setproctitle(f"airflow scheduler - DagFileProcessor {file_path}")
-
-        def _handle_dag_file_processing():
-            # Re-configure the ORM engine as there are issues with multiple processes
-            settings.configure_orm()
-
-            # Change the thread name to differentiate log lines. This is
-            # really a separate process, but changing the name of the
-            # process doesn't work, so changing the thread name instead.
-            threading.current_thread().name = thread_name
-
-            log.info("Started process (PID=%s) to work on %s", os.getpid(), 
file_path)
-            dag_file_processor = DagFileProcessor(dag_directory=dag_directory, 
log=log)
-            result: tuple[int, int, int] = dag_file_processor.process_file(
-                file_path=file_path,
-                callback_requests=callback_requests,
-                known_pools=known_pools,
-            )
-            result_channel.send(result)
-
-        try:
-            DAG_PROCESSOR_LOG_TARGET = conf.get_mandatory_value("logging", "DAG_PROCESSOR_LOG_TARGET")
-            if DAG_PROCESSOR_LOG_TARGET == "stdout":
-                with Stats.timer() as timer:
-                    _handle_dag_file_processing()
-            else:
-                # The following line ensures that stdout goes to the same destination as the logs. If stdout
-                # gets sent to logs and logs are sent to stdout, this leads to an infinite loop. This
-                # necessitates this conditional based on the value of DAG_PROCESSOR_LOG_TARGET.
-                with (
-                    redirect_stdout(StreamLogWriter(log, logging.INFO)),
-                    redirect_stderr(StreamLogWriter(log, logging.WARNING)),
-                    Stats.timer() as timer,
-                ):
-                    _handle_dag_file_processing()
-            log.info("Processing %s took %.3f seconds", file_path, 
timer.duration)
-        except Exception:
-            # Log exceptions through the logging framework.
-            log.exception("Got an exception! Propagating...")
-            raise
-        finally:
-            # We re-initialized the ORM within this Process above so we need to
-            # tear it down manually here
-            settings.dispose_orm()
-
-            result_channel.close()
-
-    def start(self) -> None:
-        """Launch the process and start processing the DAG."""
-        if conf.getboolean("scheduler", "parsing_pre_import_modules", fallback=True):
-            # Read the file to pre-import airflow modules used.
-            # This prevents them from being re-imported from zero in each "processing" process
-            # and saves CPU time and memory.
-            zip_file_paths = []
-            if zipfile.is_zipfile(self.file_path):
-                try:
-                    with zipfile.ZipFile(self.file_path) as z:
-                        zip_file_paths.extend(
-                            [
-                                os.path.join(self.file_path, info.filename)
-                                for info in z.infolist()
-                                if might_contain_dag(info.filename, True, z)
-                            ]
-                        )
-                except zipfile.BadZipFile as err:
-                    self.log.error("There was an err accessing %s, %s", self.file_path, err)
-            if zip_file_paths:
-                self.import_modules(zip_file_paths)
-            else:
-                self.import_modules(self.file_path)
-
-        context = self._get_multiprocessing_context()
-
-        pool_names = {p.pool for p in Pool.get_pools()}
-
-        _parent_channel, _child_channel = context.Pipe(duplex=False)
-        process = context.Process(
-            target=type(self)._run_file_processor,
-            args=(
-                _child_channel,
-                _parent_channel,
-                self.file_path,
-                f"DagFileProcessor{self._instance_id}",
-                self._dag_directory,
-                self._callback_requests,
-                pool_names,
-            ),
-            name=f"DagFileProcessor{self._instance_id}-Process",
-        )
-        self._process = process
-        self._start_time = timezone.utcnow()
-        process.start()
-
-        # Close the child side of the pipe now the subprocess has started -- otherwise this would prevent it
-        # from closing in some cases
-        _child_channel.close()
-        del _child_channel
-
-        # Don't store it on self until after we've started the child process - we don't want to keep it from
-        # getting GCd/closed
-        self._parent_channel = _parent_channel
-
-    def kill(self) -> None:
-        """Kill the process launched to process the file, and ensure 
consistent state."""
-        if self._process is None:
-            raise AirflowException("Tried to kill before starting!")
-        self._kill_process()
-
-    def terminate(self, sigkill: bool = False) -> None:
-        """
-        Terminate (and then kill) the process launched to process the file.
-
-        :param sigkill: whether to issue a SIGKILL if SIGTERM doesn't work.
-        """
-        if self._process is None or self._parent_channel is None:
-            raise AirflowException("Tried to call terminate before starting!")
-
-        self._process.terminate()
-        # Arbitrarily wait 5s for the process to die
-        with suppress(TimeoutError):
-            self._process._popen.wait(5)  # type: ignore
-        if sigkill:
-            self._kill_process()
-        self._parent_channel.close()
-
-    def _kill_process(self) -> None:
-        if self._process is None:
-            raise AirflowException("Tried to kill process before starting!")
-
-        if self._process.is_alive() and self._process.pid:
-            self.log.warning("Killing DAGFileProcessorProcess (PID=%d)", 
self._process.pid)
-            os.kill(self._process.pid, signal.SIGKILL)
-
-            # Reap the spawned zombie. We active wait, because in Python 3.9 `waitpid` might lead to an
-            # exception, due to change in Python standard library and possibility of race condition
-            # see https://bugs.python.org/issue42558
-            while self._process._popen.poll() is None:  # type: ignore
-                time.sleep(0.001)
-        if self._parent_channel:
-            self._parent_channel.close()
+    file: str
+    requests_fd: int
+    callback_requests: list[CallbackRequest] = pydantic.Field(default_factory=list)
+    type: Literal["DagFileParseRequest"] = "DagFileParseRequest"
 
-    @property
-    def pid(self) -> int:
-        """PID of the process launched to process the given file."""
-        if self._process is None or self._process.pid is None:
-            raise AirflowException("Tried to get PID before starting!")
-        return self._process.pid
 
-    @property
-    def exit_code(self) -> int | None:
-        """
-        After the process is finished, this can be called to get the return code.
+class DagFileParsingResult(pydantic.BaseModel):
+    """
+    Result of DAG File Parsing.
 
-        :return: the exit code of the process
-        """
-        if self._process is None:
-            raise AirflowException("Tried to get exit code before starting!")
-        if not self._done:
-            raise AirflowException("Tried to call retcode before process was 
finished!")
-        return self._process.exitcode
+    This is the result of a successful DAG parse. In this class, we gather all serialized DAGs,
+    import errors, and warnings to send back to the scheduler to store in the DB.
+    """
 
-    @property
-    def done(self) -> bool:
-        """
-        Check if the process launched to process this file is done.
+    fileloc: str
+    serialized_dags: list[LazyDeserializedDAG]
+    warnings: list | None = None
+    import_errors: dict[str, str] | None = None
+    type: Literal["DagFileParsingResult"] = "DagFileParsingResult"
 
-        :return: whether the process is finished running
-        """
-        if self._process is None or self._parent_channel is None:
-            raise AirflowException("Tried to see if it's done before 
starting!")
 
-        if self._done:
-            return True
+ToParent = Annotated[
+    Union[DagFileParsingResult, GetConnection, GetVariable],
+    pydantic.Field(discriminator="type"),
+]
 
-        if self._parent_channel.poll():
-            try:
-                self._result = self._parent_channel.recv()
-                self._done = True
-                self.log.debug("Waiting for %s", self._process)
-                self._process.join()
-                self._parent_channel.close()
-                return True
-            except EOFError:
-                # If we get an EOFError, it means the child end of the pipe has been closed. This only happens
-                # in the finally block. But due to a possible race condition, the process may have not yet
-                # terminated (it could be doing cleanup/python shutdown still). So we kill it here after a
-                # "suitable" timeout.
-                self._done = True
-                # Arbitrary timeout -- error/race condition only, so this doesn't need to be tunable.
-                self._process.join(timeout=5)
-                if self._process.is_alive():
-                    # Didn't shut down cleanly - kill it
-                    self._kill_process()
-
-        if not self._process.is_alive():
-            self._done = True
-            self.log.debug("Waiting for %s", self._process)
-            self._process.join()
-            self._parent_channel.close()
-            return True
-
-        return False
 
-    @property
-    def result(self) -> tuple[int, int, int] | None:
-        """Result of running ``DagFileProcessor.process_file()``."""
-        if not self.done:
-            raise AirflowException("Tried to get the result before it's done!")
-        return self._result
-
-    @property
-    def start_time(self) -> datetime:
-        """Time when this started to process the file."""
-        if self._start_time is None:
-            raise AirflowException("Tried to get start time before it 
started!")
-        return self._start_time
-
-    @property
-    def waitable_handle(self):
-        return self._process.sentinel
-
-    def import_modules(self, file_path: str | Iterable[str]):
-        def _import_modules(filepath):
-            for module in iter_airflow_imports(filepath):
-                try:
-                    importlib.import_module(module)
-                except Exception as e:
-                    # only log as warning because an error here is not preventing anything from working, and
-                    # if it's serious, it's going to be surfaced to the user when the dag is actually parsed.
-                    self.log.warning(
-                        "Error when trying to pre-import module '%s' found in 
%s: %s",
-                        module,
-                        file_path,
-                        e,
-                    )
-
-        if isinstance(file_path, str):
-            _import_modules(file_path)
-        elif isinstance(file_path, Iterable):
-            for path in file_path:
-                _import_modules(path)
-
-
-class DagFileProcessor(LoggingMixin):
[email protected]()
+class DagFileProcessorProcess(WatchedSubprocess):
     """
-    Process a Python file containing Airflow DAGs.
-
-    This includes:
-
-    1. Execute the file and look for DAG objects in the namespace.
-    2. Execute any Callbacks if passed to DagFileProcessor.process_file
-    3. Serialize the DAGs and save it to DB (or update existing record in the DB).
-    4. Record any errors importing the file into ORM
+    Parses DAGs with the Task SDK API.
 
-    Returns a tuple of 'number of dags found' and 'the count of import errors'
-
-    :param log: Logger to save the processing process
+    Since DAGs are written with the Task SDK, we need to parse them in a Task SDK process such that
+    we can use the Task SDK definitions when serializing. This prevents potential conflicts with classes
+    in core Airflow.
     """
 
-    UNIT_TEST_MODE: bool = conf.getboolean("core", "UNIT_TEST_MODE")
-
-    def __init__(self, dag_directory: str, log: logging.Logger):
-        super().__init__()
-        self._log = log
-        self._dag_directory = dag_directory
-        self._last_num_of_db_queries = 0
+    parsing_result: DagFileParsingResult | None = None
 
     @classmethod
-    @provide_session
-    def execute_callbacks(
+    def start(  # type: ignore[override]
         cls,
-        dagbag: DagBag,
-        callback_requests: list[CallbackRequest],
-        unit_test_mode: bool,
-        session: Session = NEW_SESSION,
-    ) -> None:
-        """
-        Execute on failure callbacks.
-
-        These objects can come from SchedulerJobRunner or from DagProcessorJobRunner.
-
-        :param dagbag: Dag Bag of dags
-        :param callback_requests: failure callbacks to execute
-        :param session: DB session.
-
-        :return: number of queries executed
-        """
-        for request in callback_requests:
-            cls.logger().debug("Processing Callback Request: %s", request)
-            try:
-                if isinstance(request, TaskCallbackRequest):
-                    cls._execute_task_callbacks(dagbag, request, unit_test_mode, session=session)
-                elif isinstance(request, DagCallbackRequest):
-                    cls._execute_dag_callbacks(dagbag, request, session=session)
-            except Exception:
-                cls.logger().exception(
-                    "Error executing %s callback for file: %s",
-                    request.__class__.__name__,
-                    request.full_filepath,
-                )
-        session.flush()
-        session.commit()
+        path: str | os.PathLike[str],
+        callbacks: list[CallbackRequest],
+        target: Callable[[], None] = _parse_file_entrypoint,
+        **kwargs,
+    ) -> Self:
+        return super().start(path, callbacks, target=target, client=None, **kwargs)  # type:ignore[arg-type]
+
+    def _on_child_started(  # type: ignore[override]
+        self, callbacks: list[CallbackRequest], path: str | os.PathLike[str], child_comms_fd: int
+    ):
+        msg = DagFileParseRequest(
+            file=os.fspath(path),
+            requests_fd=child_comms_fd,
+            callback_requests=callbacks,
+        )
+        self.stdin.write(msg.model_dump_json().encode() + b"\n")
 
-    @classmethod
-    @provide_session
-    def execute_callbacks_without_dag(
-        cls, callback_requests: list[CallbackRequest], unit_test_mode: bool, session: Session = NEW_SESSION
-    ) -> None:
-        """
-        Execute what callbacks we can as "best effort" when the dag cannot be found/had parse errors.
-
-        This is so important so that tasks that failed when there is a parse
-        error don't get stuck in queued state.
-        """
-        for request in callback_requests:
-            cls.logger().debug("Processing Callback Request: %s", request)
-            if isinstance(request, TaskCallbackRequest):
-                cls._execute_task_callbacks(None, request, unit_test_mode, session)
-            else:
-                cls.logger().info(
-                    "Not executing %s callback for file %s as there was a dag 
parse error",
-                    request.__class__.__name__,
-                    request.full_filepath,
-                )
-        session.flush()
-        session.commit()
+    def handle_requests(self, log) -> Generator[None, bytes, None]:
+        # TODO: Make decoder an instance variable, then this can live in the base class
+        decoder = pydantic.TypeAdapter[ToParent](ToParent)
 
-    @classmethod
-    def _execute_dag_callbacks(cls, dagbag: DagBag, request: DagCallbackRequest, session: Session):
-        dag = dagbag.dags[request.dag_id]
-        callbacks, context = DAG.fetch_callback(
-            dag=dag,
-            run_id=request.run_id,
-            success=not request.is_failure_callback,
-            reason=request.msg,
-            session=session,
-        ) or (None, None)
-
-        if callbacks and context:
-            DAG.execute_callback(callbacks, context, dag.dag_id)
-
-    @classmethod
-    def _execute_task_callbacks(
-        cls, dagbag: DagBag | None, request: TaskCallbackRequest, unit_test_mode: bool, session: Session
-    ) -> None:
-        """
-        Execute the task callbacks.
-
-        :param dagbag: the DagBag to use to get the task instance
-        :param request: the task callback request
-        :param session: the session to use
-        """
-        try:
-            callback_type = TaskInstanceState(request.task_callback_type)
-        except ValueError:
-            callback_type = None
-        is_remote = callback_type in (TaskInstanceState.SUCCESS, TaskInstanceState.FAILED)
+        while True:
+            line = yield
 
-        # previously we ignored any request besides failures. now if given callback type directly,
-        # then we respect it and execute it. additionally because in this scenario the callback
-        # is submitted remotely, we assume there is no need to mess with state; we simply run
-        # the callback
+            try:
+                msg = decoder.validate_json(line)
+            except Exception:
+                log.exception("Unable to decode message", line=line)
+                continue
 
-        if not is_remote and not request.is_failure_callback:
-            return
+            self._handle_request(msg, log)  # type: ignore[arg-type]
 
-        simple_ti = request.simple_task_instance
-        ti = TaskInstance.get_task_instance(
-            dag_id=simple_ti.dag_id,
-            run_id=simple_ti.run_id,
-            task_id=simple_ti.task_id,
-            map_index=simple_ti.map_index,
-            session=session,
-        )
-
-        if not ti:
+    def _handle_request(self, msg: ToParent, log):  # type: ignore[override]

Review Comment:
   ```suggestion
       def _handle_request(self, msg: ToParent, log: FilteringBoundLogger) -> None:  # type: ignore[override]
   ```
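   
   Same rationale as the earlier `-> None` suggestion. For this annotation to resolve, `FilteringBoundLogger` would presumably also need a type-checking-only import next to the other TYPE_CHECKING imports. A minimal sketch, assuming the name lives in `structlog.typing` (worth confirming against how the Task SDK itself imports it):
   
   ```python
   from typing import TYPE_CHECKING
   
   if TYPE_CHECKING:
       # Imported only for annotations, so structlog stays off this
       # module's runtime import path.
       from structlog.typing import FilteringBoundLogger
   ```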



-- 
This is an automated message from the Apache Git Service.
To respond to the message, please log on to GitHub and use the
URL above to go to the specific comment.

To unsubscribe, e-mail: [email protected]

For queries about this service, please contact Infrastructure at:
[email protected]
