zenml-io
diff --git a/‎docs/book/component-guide/deployers/local.md‎
Lines changed: 1 addition & 0 deletions b/‎docs/book/component-guide/deployers/local.md‎
Lines changed: 1 addition & 0 deletions
diff --git a/‎docs/book/how-to/deployment/deployment_settings.md‎
Lines changed: 32 additions & 0 deletions b/‎docs/book/how-to/deployment/deployment_settings.md‎
Lines changed: 32 additions & 0 deletions
diff --git a/‎src/zenml/config/deployment_settings.py‎
Lines changed: 4 additions & 1 deletion b/‎src/zenml/config/deployment_settings.py‎
Lines changed: 4 additions & 1 deletion
diff --git a/‎src/zenml/deployers/base_deployer.py‎
Lines changed: 61 additions & 0 deletions b/‎src/zenml/deployers/base_deployer.py‎
Lines changed: 61 additions & 0 deletions
diff --git a/‎src/zenml/deployers/local/local_deployer.py‎
Lines changed: 17 additions & 40 deletions b/‎src/zenml/deployers/local/local_deployer.py‎
Lines changed: 17 additions & 40 deletions
@@ -52,6 +52,7 @@ For additional configuration of the Local deployer, you can pass the following `
   * `port_range`: The range of ports to search for a free port. Defaults to `(8000, 65535)`.
   * `address`: The address that the deployment server will listen on. Defaults to `127.0.0.1`.
   * `blocking`: Whether to run the deployment in the current process instead of running it as a daemon process. Defaults to False. Use this if you want to debug issues with the deployment ASGI application itself.
+  * `auto_reload`: Whether to enable auto-reload for the uvicorn server. This is useful to speed up local development by automatically restarting the server when code changes are detected without requiring a re-provisioning of the entire deployment. Defaults to False. NOTE: the `auto_reload` setting has no effect on changes in the pipeline configuration, step configuration or stack configuration.
 
 Check out [this docs page](https://docs.zenml.io/concepts/steps_and_pipelines/configuration) for more information on how to specify settings.
 
 
@@ -241,6 +241,27 @@ A rudimentary playground dashboard is included with the ZenML python package tha
 When supplying your own custom dashboard, you may also need to [customize the security headers](./deployment_settings#secure-headers) to allow the dashboard to access various resources. For example, you may want to tweak the `Content-Security-Policy` header to allow the dashboard to access external javascript libraries, images, etc.
 {% endhint %}
 
+#### Jinja2 templates
+
+You can use a Jinja2 template to dynamically generate the `index.html` file that hosts the single-page application. This is useful if you want the dashboard content to depend on the pipeline configuration, step configuration or stack configuration. The template is rendered with a `service_info` variable that contains the service information, such as the service name, version, and description. This variable has the same structure as the `zenml.deployers.server.models.ServiceInfo` model.
+
+Example:
+
+```jinja2
+<html>
+<head>
+    <title>Pipeline: {{ service_info.pipeline.pipeline_name }}</title>
+    <meta charset="UTF-8">
+    <meta name="viewport" content="width=device-width, initial-scale=1.0">
+    <link rel="stylesheet" href="https://unpkg.com/mvp.css">
+</head>
+<body>
+    <h1>Pipeline: {{ service_info.pipeline.pipeline_name }}</h1>
+    <p>Deployment: {{ service_info.deployment.name }}</p>
+</body>
+</html>
+```
+
 ### CORS
 
 Fine-tune cross-origin access:
@@ -363,6 +384,17 @@ settings:
 
 Tune server runtime parameters for performance and topology:
 
+The following settings are available for tuning the uvicorn server:
+* `thread_pool_size`: the size of the thread pool for CPU-bound work offload.
+* `uvicorn_host`: the host to bind the uvicorn server to.
+* `uvicorn_port`: the port to bind the uvicorn server to.
+* `uvicorn_workers`: the number of workers to use for the uvicorn server.
+* `log_level`: the log level to use for the uvicorn server.
+* `uvicorn_reload`: whether to enable auto-reload for the uvicorn server. This is useful when using [the local Deployer stack component](https://docs.zenml.io/stacks/stack-components/deployers/local) to speed up local development by automatically restarting the server when code changes are detected. NOTE: the `uvicorn_reload` setting has no effect on changes in the pipeline configuration, step configuration or stack configuration.
+* `uvicorn_kwargs`: a dictionary of keyword arguments to pass to the uvicorn server.
+
+The following example shows how to configure these settings:
+
 ```python
 from zenml.config import DeploymentSettings
 from zenml.enums import LoggingLevels
 
@@ -37,7 +37,7 @@
 
 logger = get_logger(__name__)
 
-DEFAULT_DEPLOYMENT_APP_THREAD_POOL_SIZE = 20
+DEFAULT_DEPLOYMENT_APP_THREAD_POOL_SIZE = 40
 
 DEFAULT_DEPLOYMENT_APP_SECURE_HEADERS_HSTS = (
     "max-age=63072000; includeSubdomains"
@@ -633,6 +633,8 @@ class DeploymentSettings(BaseSettings):
         uvicorn_host: Host of the uvicorn server.
         uvicorn_port: Port of the uvicorn server.
         uvicorn_workers: Number of workers for the uvicorn server.
+        uvicorn_reload: Whether to automatically reload the deployment when the
+            code changes.
         log_level: Log level for the deployment application.
         uvicorn_kwargs: Keyword arguments for the uvicorn server.
 
@@ -694,6 +696,7 @@ class DeploymentSettings(BaseSettings):
     uvicorn_host: str = "0.0.0.0"  # nosec
     uvicorn_port: int = 8000
     uvicorn_workers: int = 1
+    uvicorn_reload: bool = False
     log_level: LoggingLevels = LoggingLevels.INFO
 
     uvicorn_kwargs: Dict[str, Any] = {}
 
@@ -30,9 +30,12 @@
 )
 from uuid import UUID
 
+import requests
+
 from zenml.analytics.enums import AnalyticsEvent
 from zenml.analytics.utils import track_handler
 from zenml.client import Client
+from zenml.config import DeploymentDefaultEndpoints
 from zenml.config.base_settings import BaseSettings
 from zenml.constants import (
     ENV_ZENML_ACTIVE_PROJECT_ID,
@@ -300,6 +303,56 @@ def _generate_auth_key(self, key_length: int = 32) -> str:
         alphabet = string.ascii_letters + string.digits
         return "".join(secrets.choice(alphabet) for _ in range(key_length))
 
+    def _check_deployment_health(
+        self,
+        deployment: DeploymentResponse,
+    ) -> bool:
+        """Check if the deployment is healthy by calling its health check endpoint.
+
+        Args:
+            deployment: The deployment to check.
+
+        Returns:
+            True if the deployment is healthy, False otherwise.
+        """
+        assert deployment.snapshot, "Deployment snapshot not found"  # the deployment settings are read from the snapshot
+
+        settings = (
+            deployment.snapshot.pipeline_configuration.deployment_settings
+        )
+
+        # If the health check endpoint is disabled, there is nothing to probe, so we consider the deployment healthy.
+        if (
+            DeploymentDefaultEndpoints.HEALTH
+            not in settings.include_default_endpoints
+        ):
+            return True
+
+        if not deployment.url:  # no URL to probe, so report the deployment as not healthy
+            return False
+
+        health_check_path = f"{settings.root_url_path}{settings.api_url_path}{settings.health_url_path}"
+        health_check_url = f"{deployment.url}{health_check_path}"
+
+        # Attempt to connect to the deployment and check if it is healthy (only an HTTP 200 response counts as healthy)
+        try:
+            response = requests.get(health_check_url, timeout=3)  # timeout (in seconds) keeps an unresponsive server from blocking indefinitely
+            if response.status_code == 200:
+                return True
+            else:
+                logger.debug(
+                    f"Health check endpoint for deployment '{deployment.name}' "
+                    f"at '{health_check_url}' returned status code "
+                    f"{response.status_code}"
+                )
+                return False
+        except Exception as e:  # best-effort probe: any failure is logged at debug level and reported as not healthy
+            logger.debug(
+                f"Health check endpoint for deployment '{deployment.name}' "
+                f"at '{health_check_url}' is not reachable: {e}"
+            )
+            return False
+
     def _poll_deployment(
         self,
         deployment: DeploymentResponse,
@@ -335,6 +388,11 @@ def _poll_deployment(
             )
             try:
                 deployment_state = self.do_get_deployment_state(deployment)
+
+                if deployment_state.status == DeploymentStatus.RUNNING:
+                    if not self._check_deployment_health(deployment):
+                        deployment_state.status = DeploymentStatus.PENDING
+
             except DeploymentNotFoundError:
                 deployment_state = DeploymentOperationalState(
                     status=DeploymentStatus.ABSENT
@@ -675,6 +733,9 @@ def refresh_deployment(
         )
         try:
             deployment_state = self.do_get_deployment_state(deployment)
+            if deployment_state.status == DeploymentStatus.RUNNING:
+                if not self._check_deployment_health(deployment):
+                    deployment_state.status = DeploymentStatus.PENDING
         except DeploymentNotFoundError:
             deployment_state.status = DeploymentStatus.ABSENT
         except DeployerError as e:
 
@@ -32,7 +32,6 @@
 from uuid import UUID
 
 import psutil
-import requests
 from pydantic import BaseModel
 
 from zenml.config.base_settings import BaseSettings
@@ -112,13 +111,16 @@ class LocalDeployerSettings(BaseDeployerSettings):
         address: Address to bind the server to.
         blocking: Whether to run the deployment in the current process instead
             of running it as a daemon process.
+        auto_reload: Whether to automatically reload the deployment when the
+            code changes.
     """
 
     port: Optional[int] = None
     allocate_port_if_busy: bool = True
     port_range: Tuple[int, int] = (8000, 65535)
     address: str = "127.0.0.1"
     blocking: bool = False
+    auto_reload: bool = False
 
 
 class LocalDeployerConfig(BaseDeployerConfig, LocalDeployerSettings):
@@ -230,6 +232,15 @@ def do_provision_deployment(
 
         existing_meta = LocalDeploymentMetadata.from_deployment(deployment)
 
+        if existing_meta.pid:
+            try:
+                stop_process(existing_meta.pid)
+            except Exception as e:
+                logger.warning(
+                    f"Failed to stop existing daemon process for deployment "
+                    f"'{deployment.name}' with PID {existing_meta.pid}: {e}"
+                )
+
         preferred_ports: List[int] = []
         if settings.port:
             preferred_ports.append(settings.port)
@@ -265,15 +276,6 @@ def do_provision_deployment(
         if not os.path.exists(runtime_dir):
             os.makedirs(runtime_dir, exist_ok=True)
 
-        if existing_meta.pid:
-            try:
-                stop_process(existing_meta.pid)
-            except Exception as e:
-                logger.warning(
-                    f"Failed to stop existing daemon process for deployment "
-                    f"'{deployment.name}' with PID {existing_meta.pid}: {e}"
-                )
-
         if settings.blocking:
             self._update_deployment(
                 deployment,
@@ -291,6 +293,7 @@ def do_provision_deployment(
                 deployment_id=deployment.id,
                 host=settings.address,
                 port=port,
+                reload=settings.auto_reload,
             )
             self._update_deployment(
                 deployment,
@@ -320,6 +323,9 @@ def do_provision_deployment(
             str(port),
         ]
 
+        if settings.auto_reload:
+            cmd.append("--reload")
+
         try:
             os.makedirs(os.path.dirname(log_file), exist_ok=True)
             proc = subprocess.Popen(
@@ -382,41 +388,12 @@ def do_get_deployment_state(
             return state
 
         # Report RUNNING here; the base deployer's health check downgrades the
         # status to PENDING until the deployment is actually reachable
-        state.status = DeploymentStatus.PENDING
+        state.status = DeploymentStatus.RUNNING
         address = meta.address
         if address == "0.0.0.0":  # nosec
             address = "localhost"
         state.url = f"http://{address}:{meta.port}"
 
-        settings = (
-            deployment.snapshot.pipeline_configuration.deployment_settings
-        )
-        health_check_path = f"{settings.root_url_path}{settings.api_url_path}{settings.health_url_path}"
-        health_check_url = f"{state.url}{health_check_path}"
-
-        # Attempt to connect to the daemon and set the status to RUNNING
-        # if successful
-        try:
-            response = requests.get(health_check_url, timeout=3)
-            if response.status_code == 200:
-                state.status = DeploymentStatus.RUNNING
-            else:
-                logger.debug(
-                    f"Daemon for deployment '{deployment.name}' returned "
-                    f"status code {response.status_code} for health check "
-                    f"at '{health_check_url}'"
-                )
-        except Exception as e:
-            logger.debug(
-                f"Daemon for deployment '{deployment.name}' is not "
-                f"reachable at '{health_check_url}': {e}"
-            )
-            # It can take a long time after the deployment is started until
-            # the deployment is ready to serve requests, but this isn't an
-            # error condition. We return PENDING instead of ERROR here to
-            # signal to the polling in the base deployer class to keep trying.
-            state.status = DeploymentStatus.PENDING
-
         state.metadata = meta.model_dump(exclude_none=True)
 
         return state