Small fixes and better docstrings

stefannica · stefannica · commit 65c4de83684c · 2025-10-15T23:46:41.000+02:00
diff --git a/examples/weather_agent/pipelines/weather_agent.py b/examples/weather_agent/pipelines/weather_agent.py
@@ -1,6 +1,7 @@
 """Weather Agent Pipeline."""
 
 import os
+import time
 
 from pipelines.hooks import (
     InitConfig,
@@ -10,9 +11,10 @@
 from steps import analyze_weather_with_llm, get_weather
 
 from zenml import pipeline
-from zenml.config import DockerSettings
+from zenml.config import DeploymentSettings, DockerSettings
 
 # Import enums for type-safe capture mode configuration
+from zenml.config.deployment_settings import MiddlewareSpec
 from zenml.config.docker_settings import PythonPackageInstaller
 from zenml.config.resource_settings import ResourceSettings
 
@@ -22,6 +24,58 @@
     python_package_installer=PythonPackageInstaller.UV,
 )
 
+
+class RequestTimingMiddleware:
+    """ASGI middleware to measure request processing time.
+
+    Uses the standard ASGI interface (scope, receive, send) which works
+    across all ASGI frameworks: FastAPI, Django, Starlette, Quart, etc.
+    """
+
+    def __init__(self, app):
+        self.app = app
+
+    async def __call__(self, scope, receive, send):
+        """Process ASGI request with timing measurement.
+
+        Args:
+            scope: ASGI connection scope (contains request info).
+            receive: Async callable to receive ASGI events.
+            send: Async callable to send ASGI events.
+        """
+        if scope["type"] != "http":
+            return await self.app(scope, receive, send)
+
+        start_time = time.time()
+
+        async def send_wrapper(message):
+            """Intercept response to add timing header."""
+            if message["type"] == "http.response.start":
+                process_time = (time.time() - start_time) * 1000
+                headers = list(message.get("headers", []))
+                headers.append(
+                    (
+                        b"x-process-time-ms",
+                        str(process_time).encode(),
+                    )
+                )
+                message = {**message, "headers": headers}
+
+            await send(message)
+
+        await self.app(scope, receive, send_wrapper)
+
+
+deployment_settings = DeploymentSettings(
+    custom_middlewares=[
+        MiddlewareSpec(
+            middleware=RequestTimingMiddleware,
+            order=10,
+            native=True,
+        ),
+    ],
+)
+
 environment = {}
 if os.getenv("OPENAI_API_KEY"):
     environment["OPENAI_API_KEY"] = os.getenv("OPENAI_API_KEY")
@@ -34,6 +88,7 @@
     on_cleanup=cleanup_hook,
     settings={
         "docker": docker_settings,
+        "deployment": deployment_settings,
         "deployer.gcp": {
             "allow_unauthenticated": True,
             # "location": "us-central1",
diff --git a/src/zenml/config/deployment_settings.py b/src/zenml/config/deployment_settings.py
@@ -446,16 +446,131 @@ class SecureHeadersConfig(BaseModel):
 
 
 class DeploymentSettings(BaseSettings):
-    """Settings for the pipeline deployment."""
+    """Settings for the pipeline deployment.
+
+    Use these settings to fully customize all aspects of the uvicorn web server
+    and ASGI web application that constitute the pipeline deployment.
+
+    Note that these settings are only available at the pipeline level.
+
+    The following customizations can be used to configure aspects that are
+    framework-agnostic (i.e. not specific to a particular ASGI framework like
+    FastAPI, Django, Starlette, etc.):
+
+    * the ASGI application details: `app_title`, `app_description`,
+    `app_version` and `app_kwargs`
+    * the URL paths for the various built-in endpoints: `root_url_path`,
+    `docs_url_path`, `redoc_url_path`, `invoke_url_path`, `health_url_path`,
+    `info_url_path` and `metrics_url_path`
+    * the location of dashboard static files can be provided to replace the
+    default UI that is included with the deployment ASGI application:
+    `dashboard_files_path`
+    * the CORS configuration: `cors`
+    * the secure headers configuration: `secure_headers`
+    * the thread pool size: `thread_pool_size`
+    * custom application startup and shutdown hooks: `startup_hook`,
+    `shutdown_hook`, `startup_hook_kwargs` and `shutdown_hook_kwargs`
+    * uvicorn server configuration: `uvicorn_host`, `uvicorn_port`,
+    `uvicorn_workers` and `uvicorn_kwargs`
+
+    In addition to the above, the following advanced features can be used to
+    customize the implementation-specific details of the deployment application:
+
+    * custom endpoints (e.g. custom metrics, custom health, etc.): `custom_endpoints`
+    * custom middlewares (e.g. authentication, logging, etc.): `custom_middlewares`
+    * application building extensions - these are pluggable components that can
+    be used to add advanced framework-specific features like custom authentication,
+    logging, metrics, etc.: `app_extensions`
+
+    Ultimately, if none of the above is sufficient, the user can provide
+    custom implementations for the two core components that are used to build
+    and run the deployment application itself:
+
+    * the deployment app runner - this is the component that is responsible for
+    building and running the ASGI application. It is represented by the
+    `zenml.deployers.server.BaseDeploymentAppRunner` class.
+    See: `deployment_app_runner_source` and `deployment_app_runner_kwargs`
+    * the deployment service - this is the component that is responsible for
+    handling the business logic of the pipeline deployment. It is represented
+    by the `zenml.deployers.server.service.BasePipelineDeploymentService`
+    class. See: `deployment_service_source` and `deployment_service_kwargs`
+
+    Both of these base classes or their existing implementations can be extended
+    and provided as sources in the deployment settings to be loaded at runtime.
 
-    # This settings is only available at the pipeline level
+    Attributes:
+        app_title: Title of the deployment application.
+        app_description: Description of the deployment application.
+        app_version: Version of the deployment application.
+        app_kwargs: Arbitrary framework-specific keyword arguments to be passed
+            to the deployment ASGI application constructor.
+
+        include_default_endpoints: Whether to include the default endpoints in
+            the ASGI application.
+        include_default_middleware: Whether to include the default middleware
+            in the ASGI application.
+
+        root_url_path: Root URL path.
+        docs_url_path: URL path for the OpenAPI documentation endpoint.
+        redoc_url_path: URL path for the Redoc documentation endpoint.
+        invoke_url_path: URL path for the invoke endpoint.
+        health_url_path: URL path for the health check endpoint.
+        info_url_path: URL path for the info endpoint.
+        metrics_url_path: URL path for the metrics endpoint.
+        dashboard_files_path: Path where the dashboard static files are located.
+            This can be used to replace the default UI that is included with the
+            deployment ASGI application. The referenced directory must contain
+            at a minimum an `index.html` file and an `assets` directory. The path
+            can be absolute or relative to the root of the repository
+            initialized with `zenml init` or relative to the current working
+            directory.
+
+        cors: Configuration for CORS.
+        secure_headers: Configuration for secure headers.
+        thread_pool_size: Size of the thread pool for the ASGI application.
+
+        startup_hook: Custom startup hook for the ASGI application.
+        shutdown_hook: Custom shutdown hook for the ASGI application.
+        startup_hook_kwargs: Keyword arguments for the startup hook.
+        shutdown_hook_kwargs: Keyword arguments for the shutdown hook.
+
+        custom_endpoints: Custom endpoints for the ASGI application. See the
+            `EndpointSpec` class for more details.
+        custom_middlewares: Custom middlewares for the ASGI application. See the
+            `MiddlewareSpec` class for more details.
+        app_extensions: App extensions used to build the ASGI application. See
+            the `AppExtensionSpec` class for more details.
+
+        uvicorn_host: Host of the uvicorn server.
+        uvicorn_port: Port of the uvicorn server.
+        uvicorn_workers: Number of workers for the uvicorn server.
+        log_level: Log level for the deployment application.
+        uvicorn_kwargs: Keyword arguments for the uvicorn server.
+
+        deployment_app_runner_source: Source of the deployment app runner. Must
+            point to a class that extends the
+            `zenml.deployers.server.BaseDeploymentAppRunner` class.
+        deployment_app_runner_kwargs: Keyword arguments for the deployment app
+            runner. These will be passed to the constructor of the deployment app
+            runner class.
+        deployment_service_source: Source of the deployment service. Must point
+            to a class that extends
+            `zenml.deployers.server.service.BasePipelineDeploymentService`.
+        deployment_service_kwargs: Keyword arguments for the deployment service.
+            These will be passed to the constructor of the deployment service class.
+    """
+
+    # These settings are only available at the pipeline level
     LEVEL: ClassVar[ConfigurationLevel] = ConfigurationLevel.PIPELINE
 
     app_title: Optional[str] = None
     app_description: Optional[str] = None
     app_version: Optional[str] = None
     app_kwargs: Dict[str, Any] = {}
 
+    include_default_endpoints: bool = True
+    include_default_middleware: bool = True
+
     root_url_path: str = DEFAULT_DEPLOYMENT_APP_ROOT_URL_PATH
     docs_url_path: str = DEFAULT_DEPLOYMENT_APP_DOCS_URL_PATH
     redoc_url_path: str = DEFAULT_DEPLOYMENT_APP_REDOC_URL_PATH
@@ -464,15 +579,15 @@ class DeploymentSettings(BaseSettings):
     info_url_path: str = DEFAULT_DEPLOYMENT_APP_INFO_URL_PATH
     metrics_url_path: str = DEFAULT_DEPLOYMENT_APP_METRICS_URL_PATH
 
-    dashboard_files_path: str = ""
+    dashboard_files_path: Optional[str] = None
 
     cors: CORSConfig = CORSConfig()
     secure_headers: SecureHeadersConfig = SecureHeadersConfig()
 
     thread_pool_size: int = DEFAULT_DEPLOYMENT_APP_THREAD_POOL_SIZE
 
-    startup_hook_source: Optional[SourceOrObjectField] = None
-    shutdown_hook_source: Optional[SourceOrObjectField] = None
+    startup_hook: Optional[SourceOrObjectField] = None
+    shutdown_hook: Optional[SourceOrObjectField] = None
     startup_hook_kwargs: Dict[str, Any] = {}
     shutdown_hook_kwargs: Dict[str, Any] = {}
 
@@ -483,12 +598,6 @@ class DeploymentSettings(BaseSettings):
     # Pluggable app extensions for advanced features
     app_extensions: Optional[List[AppExtensionSpec]] = None
 
-    # Include default endpoints in the deployment application
-    include_default_endpoints: bool = True
-
-    # Include default middleware in the deployment application
-    include_default_middleware: bool = True
-
     uvicorn_host: str = "0.0.0.0"
     uvicorn_port: int = 8000
     uvicorn_workers: int = 1
@@ -503,10 +612,10 @@ class DeploymentSettings(BaseSettings):
 
     def load_sources(self) -> None:
         """Load source string into callable."""
-        if self.startup_hook_source is not None:
-            self.startup_hook_source.load()
-        if self.shutdown_hook_source is not None:
-            self.shutdown_hook_source.load()
+        if self.startup_hook is not None:
+            self.startup_hook.load()
+        if self.shutdown_hook is not None:
+            self.shutdown_hook.load()
         if self.deployment_app_runner_source is not None:
             self.deployment_app_runner_source.load()
         if self.deployment_service_source is not None:
diff --git a/src/zenml/deployers/containerized_deployer.py b/src/zenml/deployers/containerized_deployer.py
@@ -38,7 +38,9 @@
 class ContainerizedDeployer(BaseDeployer, ABC):
     """Base class for all containerized deployers."""
 
-    CONTAINER_REQUIREMENTS: List[str] = []
+    # TODO: this needs to come from the deployment settings or from the
+    # app runner class itself
+    CONTAINER_REQUIREMENTS: List[str] = ["uvicorn", "fastapi", "secure~=0.3.0"]
 
     @staticmethod
     def get_image(snapshot: PipelineSnapshotResponse) -> str:
diff --git a/src/zenml/deployers/docker/docker_deployer.py b/src/zenml/deployers/docker/docker_deployer.py
@@ -135,7 +135,6 @@ def from_deployment(
 class DockerDeployer(ContainerizedDeployer):
     """Deployer responsible for deploying pipelines locally using Docker."""
 
-    CONTAINER_REQUIREMENTS: List[str] = ["uvicorn", "fastapi"]
     _docker_client: Optional[DockerClient] = None
 
     @property
diff --git a/src/zenml/deployers/server/app.py b/src/zenml/deployers/server/app.py
@@ -48,7 +48,7 @@
 )
 from zenml.deployers.server.service import (
     BasePipelineDeploymentService,
-    DefaultPipelineDeploymentService,
+    PipelineDeploymentService,
 )
 from zenml.integrations.registry import integration_registry
 from zenml.logger import get_logger
@@ -276,7 +276,7 @@ def load_deployment_service(
         )
         if settings.deployment_service_source is None:
             service_cls: Type[BasePipelineDeploymentService] = (
-                DefaultPipelineDeploymentService
+                PipelineDeploymentService
             )
         else:
             try:
@@ -647,10 +647,10 @@ def _run_startup_hook(self) -> None:
         Raises:
             ValueError: If the startup hook is not callable.
         """
-        if not self.settings.startup_hook_source:
+        if not self.settings.startup_hook:
             return
 
-        startup_hook = self.settings.startup_hook_source.load()
+        startup_hook = self.settings.startup_hook.load()
 
         if not callable(startup_hook):
             raise ValueError(
@@ -690,10 +690,10 @@ def _run_shutdown_hook(self) -> None:
         Raises:
             ValueError: If the shutdown hook is not callable.
         """
-        if not self.settings.shutdown_hook_source:
+        if not self.settings.shutdown_hook:
             return
 
-        shutdown_hook = self.settings.shutdown_hook_source.load()
+        shutdown_hook = self.settings.shutdown_hook.load()
 
         if not shutdown_hook:
             return
diff --git a/src/zenml/deployers/server/service.py b/src/zenml/deployers/server/service.py
@@ -312,7 +312,7 @@ class PipelineInvokeResponse(BaseDeploymentInvocationResponse):
             return PipelineInvokeRequest, PipelineInvokeResponse
 
 
-class DefaultPipelineDeploymentService(BasePipelineDeploymentService):
+class PipelineDeploymentService(BasePipelineDeploymentService):
     """Default pipeline deployment service implementation."""
 
     def initialize(self) -> None:
diff --git a/src/zenml/deployers/utils.py b/src/zenml/deployers/utils.py
@@ -21,7 +21,9 @@
 import requests
 
 from zenml.client import Client
-from zenml.config.deployment_settings import DEFAULT_DEPLOYMENT_APP_INVOKE_URL_PATH
+from zenml.config.deployment_settings import (
+    DEFAULT_DEPLOYMENT_APP_INVOKE_URL_PATH,
+)
 from zenml.config.step_configurations import Step
 from zenml.deployers.exceptions import (
     DeploymentHTTPError,
diff --git a/src/zenml/integrations/aws/deployers/aws_deployer.py b/src/zenml/integrations/aws/deployers/aws_deployer.py
@@ -253,8 +253,6 @@ def from_deployment(
 class AWSDeployer(ContainerizedDeployer):
     """Deployer responsible for deploying pipelines on AWS App Runner."""
 
-    CONTAINER_REQUIREMENTS: List[str] = ["uvicorn", "fastapi"]
-
     _boto_session: Optional[boto3.Session] = None
     _region: Optional[str] = None
     _app_runner_client: Optional[Any] = None
diff --git a/src/zenml/integrations/gcp/deployers/gcp_deployer.py b/src/zenml/integrations/gcp/deployers/gcp_deployer.py
@@ -247,8 +247,6 @@ def from_deployment(
 class GCPDeployer(ContainerizedDeployer, GoogleCredentialsMixin):
     """Deployer responsible for deploying pipelines on GCP Cloud Run."""
 
-    CONTAINER_REQUIREMENTS: List[str] = ["uvicorn", "fastapi"]
-
     _credentials: Optional[Any] = None
     _project_id: Optional[str] = None
     _cloud_run_client: Optional[run_v2.ServicesClient] = None
diff --git a/src/zenml/orchestrators/step_launcher.py b/src/zenml/orchestrators/step_launcher.py
@@ -26,7 +26,6 @@
     ENV_ZENML_STEP_OPERATOR,
     handle_bool_env_var,
 )
-from zenml.deployers.server import runtime
 from zenml.enums import ExecutionMode, ExecutionStatus
 from zenml.environment import get_run_environment_dict
 from zenml.exceptions import RunInterruptedException, RunStoppedException
@@ -424,6 +423,8 @@ def _run_step(
             step_run: The model of the current step run.
             force_write_logs: The context for the step logs.
         """
+        from zenml.deployers.server import runtime
+
         step_run_info = StepRunInfo(
             config=self._step.config,
             pipeline=self._snapshot.pipeline_configuration,
diff --git a/src/zenml/orchestrators/step_runner.py b/src/zenml/orchestrators/step_runner.py
diff --git a/src/zenml/utils/source_utils.py b/src/zenml/utils/source_utils.py