
Commit 090a1c2

stefannica and schustmi authored
Idempotent POST requests, request caching and other performance improvements (#3738)
* Increase the file descriptor count limit on the ZenML server container and log more metrics
* Reduce logged metrics and add a parallel option to the stress test
* Lighter health check endpoints and more conservative k8s probe timeouts
* Fix linter errors
* Add event loop monitor and move user activity DB call outside the event loop
* Add endpoint debug stats and retry client POST requests
* Add log parser and metrics visualiser and more logs
* Some logging improvements
* Implement centralized request management with deduplication and caching
* Implement idempotency checks and request retries
* Implement SQLAlchemy idempotent Session
* Reverted all SQLZenStore changes
* Reimplemented transaction management with database caching
* Fix transaction result table type and encode result as base64 secret
* Enable deduplication for POST requests, but only for a selected set of endpoints
* Update src/zenml/models/v2/core/api_transaction.py
  Co-authored-by: Michael Schuster <[email protected]>
* Update src/zenml/zen_server/middleware.py
  Co-authored-by: Michael Schuster <[email protected]>
* Add transaction table indices and improve queries; increase auth threads to 5
* Fix the transaction finalization to include the result
* Fix long URL when fetching input steps
* Fix linter on Windows
* Add new configuration options to the Helm chart
* Fix linter errors
* Fix the resolve_step_inputs utility
* Move user activity global vars together
* Reorder DB migration versions
* Fix URL split in resolve_step_inputs and Windows unit tests
---------
Co-authored-by: Michael Schuster <[email protected]>
1 parent 3c4f77a commit 090a1c2

40 files changed: +3559 −666 lines
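A note on the deduplication and caching work listed in the commit message: the general pattern behind idempotent POST handling is that the client attaches a stable transaction (idempotency) identifier to selected POST requests and retries them on failure, while the server records the outcome of the first completed attempt and replays it for retries instead of creating duplicate entities. In this commit the server side revolves around the api_transaction model and database-backed transaction caching (results encoded as base64 secrets), with changes in src/zenml/zen_server/middleware.py. The sketch below is only a minimal, hypothetical illustration of the pattern as a FastAPI middleware with an in-memory store; the "Idempotency-Key" header, the IDEMPOTENT_PATHS set and the dictionary cache are assumptions for illustration, not the actual ZenML implementation.

# Hypothetical sketch: idempotency-keyed POST deduplication as FastAPI middleware.
# Header name, path set and in-memory storage are illustrative assumptions only.
from typing import Dict, Tuple

from fastapi import FastAPI, Request, Response

app = FastAPI()

# Deduplication is only enabled for a selected set of POST endpoints (assumed paths).
IDEMPOTENT_PATHS = {"/api/v1/runs", "/api/v1/pipeline_deployments"}
# transaction ID -> (status code, body, content type)
_results: Dict[str, Tuple[int, bytes, str]] = {}


@app.middleware("http")
async def deduplicate_posts(request: Request, call_next):
    key = request.headers.get("Idempotency-Key")
    if request.method != "POST" or not key or request.url.path not in IDEMPOTENT_PATHS:
        return await call_next(request)

    if key in _results:
        # A retry of a request that already completed: replay the stored result
        # instead of re-executing the handler and creating a duplicate entity.
        status, body, content_type = _results[key]
        return Response(content=body, status_code=status, media_type=content_type)

    response = await call_next(request)
    # Drain the response body so it can be stored and still returned to the caller.
    body = b"".join([chunk async for chunk in response.body_iterator])
    if 200 <= response.status_code < 300:
        # A real implementation would also mark in-flight transactions so that
        # concurrent duplicates wait or fail fast rather than both executing.
        _results[key] = (
            response.status_code,
            body,
            response.headers.get("content-type", "application/json"),
        )
    return Response(
        content=body,
        status_code=response.status_code,
        headers=dict(response.headers),
    )

The client-side counterpart is to generate the key once per logical request and reuse it on every retry, which is what makes retrying POSTs safe.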

docker/base.Dockerfile

Lines changed: 5 additions & 2 deletions
@@ -184,6 +184,8 @@ RUN groupadd --gid $USER_GID $USERNAME \
 COPY --chown=$USERNAME:$USER_GID --from=server-builder /opt/venv /opt/venv
 # Copy the requirements.txt file from the builder stage
 COPY --chown=$USERNAME:$USER_GID --from=server-builder /zenml/requirements.txt /zenml/requirements.txt
+COPY --chown=$USERNAME:$USER_GID scripts/docker-entrypoint.sh /entrypoint.sh
+RUN chmod +x /entrypoint.sh

 ENV PATH="$VIRTUAL_ENV/bin:/home/$USERNAME/.local/bin:$PATH"

@@ -192,5 +194,6 @@ USER $USERNAME

 # Start the ZenML server
 EXPOSE 8080
-ENTRYPOINT ["uvicorn", "zenml.zen_server.zen_server_api:app", "--log-level", "debug", "--no-server-header", "--proxy-headers", "--forwarded-allow-ips", "*"]
-CMD ["--port", "8080", "--host", "0.0.0.0"]
+ENTRYPOINT ["/entrypoint.sh"]
+
+CMD ["uvicorn", "zenml.zen_server.zen_server_api:app", "--no-server-header", "--proxy-headers", "--forwarded-allow-ips", "*", "--port", "8080", "--host", "0.0.0.0"]

docker/zenml-server-dev.Dockerfile

Lines changed: 6 additions & 4 deletions
@@ -138,6 +138,8 @@ COPY --chown=$USERNAME:$USER_GID --from=builder /zenml/requirements.txt /zenml/r
 # Copy source code
 COPY --chown=$USERNAME:$USER_GID README.md pyproject.toml ./
 COPY --chown=$USERNAME:$USER_GID src src
+COPY --chown=$USERNAME:$USER_GID scripts/docker-entrypoint.sh /entrypoint.sh
+RUN chmod +x /entrypoint.sh

 FROM common-runtime AS local-runtime

@@ -147,8 +149,8 @@ RUN pip install --no-deps --no-cache -e .[server,secrets-aws,secrets-gcp,secrets

 EXPOSE 8080

-ENTRYPOINT ["uvicorn", "zenml.zen_server.zen_server_api:app", "--log-level", "debug", "--no-server-header", "--proxy-headers", "--forwarded-allow-ips", "*", "--reload", "--access-log"]
-CMD ["--port", "8080", "--host", "0.0.0.0"]
+ENTRYPOINT ["/entrypoint.sh"]
+CMD ["uvicorn", "zenml.zen_server.zen_server_api:app", "--log-level", "debug", "--no-server-header", "--proxy-headers", "--forwarded-allow-ips", "*", "--reload", "--port", "8080", "--host", "0.0.0.0"]


 FROM common-runtime AS runtime
@@ -160,5 +162,5 @@ RUN pip install --no-deps --no-cache .[server,secrets-aws,secrets-gcp,secrets-az

 EXPOSE 8080

-ENTRYPOINT ["uvicorn", "zenml.zen_server.zen_server_api:app", "--log-level", "debug", "--no-server-header", "--proxy-headers", "--forwarded-allow-ips", "*", "--access-log"]
-CMD ["--port", "8080", "--host", "0.0.0.0"]
+ENTRYPOINT ["/entrypoint.sh"]
+CMD ["uvicorn", "zenml.zen_server.zen_server_api:app", "--log-level", "debug", "--no-server-header", "--proxy-headers", "--forwarded-allow-ips", "*", "--port", "8080", "--host", "0.0.0.0"]

examples/stress-test/results.ipynb

Lines changed: 147 additions & 0 deletions
New file. The notebook source is a markdown cell titled "# Stress Test Results" followed by five code cells (kernel: .venv, Python 3.10.12):

Cell 1:
from utils import LogFile

Cell 2:
# log_file = LogFile.parse_logs("../../../../docs/aiml/zenml/stress-tests/server-logs-040-40th-1000-steps-30s-50-batch-no-rbac-endpoint-metrics.txt")
# log_file = LogFile.parse_logs("../../../../docs/aiml/zenml/stress-tests/server-logs-041-40th-1000-steps-30s-50-batch-no-rbac-no-service-connector.txt")
# log_file = LogFile.parse_logs("../../../../docs/aiml/zenml/stress-tests/server-logs-042-20th-1000-steps-30s-50-batch-no-rbac-no-service-connector.txt")
# log_file = LogFile.parse_logs("../../../../docs/aiml/zenml/stress-tests/server-logs-043-2th-1000-steps-30s-50-batch-no-rbac-no-service-connector.txt")
# log_file = LogFile.parse_logs("../../../../docs/aiml/zenml/stress-tests/server-logs-044-4th-1000-steps-30s-50-batch-no-rbac-no-service-connector.txt")
# log_file = LogFile.parse_logs("../../../../docs/aiml/zenml/stress-tests/server-logs-044-4th-1000-steps-30s-50-batch-no-rbac-no-service-connector-take-2.txt")
# log_file = LogFile.parse_logs("../../../../docs/aiml/zenml/stress-tests/server-logs-045-8th-1000-steps-30s-50-batch-no-rbac-no-service-connector.txt")
# log_file = LogFile.parse_logs("../../../../docs/aiml/zenml/stress-tests/server-logs-046-8th-1000-steps-30s-50-batch-no-rbac.txt")
# log_file = LogFile.parse_logs("../../../../docs/aiml/zenml/stress-tests/server-logs-047-2th-1000-steps-30s-50-batch-no-rbac.txt")
# log_file = LogFile.parse_logs("../../../../docs/aiml/zenml/stress-tests/server-logs-048-2th-1000-steps-30s-50-batch.txt")
# log_file = LogFile.parse_logs("../../../../docs/aiml/zenml/stress-tests/server-logs-049-4th-1000-steps-30s-50-batch.txt")
# log_file = LogFile.parse_logs("../../../../docs/aiml/zenml/stress-tests/server-logs-050-8th-1000-steps-30s-50-batch.txt")
# log_file = LogFile.parse_logs("../../../../docs/aiml/zenml/stress-tests/server-logs-050-8th-1000-steps-30s-50-batch-take-2.txt")
# log_file = LogFile.parse_logs("../../../../docs/aiml/zenml/stress-tests/server-logs-050-8th-1000-steps-30s-50-batch-take-3.txt")
# log_file = LogFile.parse_logs("../../../../docs/aiml/zenml/stress-tests/server-logs-051-8th-1000-steps-30s-50-batch-deduplication.txt")
# log_file = LogFile.parse_logs("../../../../docs/aiml/zenml/stress-tests/server-logs-052-8th-1000-steps-30s-50-batch-deduplication-take-2.txt")
# log_file = LogFile.parse_logs("../../../../docs/aiml/zenml/stress-tests/server-logs-053-2th-1000-steps-30s-50-batch-deduplication.txt")
log_file = LogFile.parse_logs(
    "../../../../docs/aiml/zenml/stress-tests/server-logs-054-2th-1000-steps-30s-50-batch-deduplication-async-auth.txt"
)

Cell 3:
# log_file.request_flows["b170dbe2"]

Cell 4:
log_file.plot_request_flows(
    start_time=200,
    end_time=500,
    max_requests=5000,
    # pps=10,
    # width=2000,
    height=1000,
    width=1900,
    # pod=1,
    hide_legend=True,
    hide_y_axis=True,
    # api_call_filter=[
    #     ".*/api/v1/service_connectors/<uuid>/client",
    #     ".*/api/v1/runs$",
    #     ".*/api/v1/pipeline_deployments",
    # ],
    # min_duration=1,
    # group_retry_requests=False,
    # filter_states=[LogType.SQL_STARTED, LogType.SQL_COMPLETED],
    request_id="88ddf46e",
)

Cell 5:
log_file.plot(
    log_file.get_plot_fn(
        y_metric="threads",
        # y_metric="memory_usage",
        # y_metric="active_requests",
        label_attribute="pod",
    ),
)

examples/stress-test/run.py

Lines changed: 87 additions & 40 deletions
@@ -16,7 +16,7 @@
 #

 import time
-from typing import Annotated, Any, Dict, Tuple
+from typing import Annotated, Any, Dict, Optional, Tuple

 import click

@@ -29,45 +29,63 @@
 )
 from zenml.integrations.kubernetes.pod_settings import KubernetesPodSettings

-kubernetes_settings = KubernetesOrchestratorSettings(
-    pod_startup_timeout=600,
-    pod_settings=KubernetesPodSettings(
-        resources={
-            "requests": {"cpu": "100m", "memory": "500Mi"},
-            # "limits": {"memory": "500Mi"}, -> grows linearly with number of steps
-        },
-        node_selectors={"pool": "workloads"},
-        tolerations=[
-            {
-                "key": "pool",
-                "operator": "Equal",
-                "value": "workloads",
-                "effect": "NoSchedule",
-            }
-        ],
-        env=[{"name": "ZENML_LOGGING_VERBOSITY", "value": "debug"}],
-    ),
-    orchestrator_pod_settings=KubernetesPodSettings(
-        resources={
-            "requests": {"cpu": "100m", "memory": "500Mi"},
-            # "limits": {"memory": "500Mi"}, # -> grows linearly with number of steps
-        },
-        node_selectors={"pool": "workloads"},
-        tolerations=[
-            {
-                "key": "pool",
-                "operator": "Equal",
-                "value": "workloads",
-                "effect": "NoSchedule",
-            }
-        ],
-    ),
-)
+
+def get_kubernetes_settings(
+    max_parallelism: Optional[int],
+) -> KubernetesOrchestratorSettings:
+    """Get the Kubernetes settings for the ZenML server.
+
+    Args:
+        max_parallelism: The maximum number of parallel steps to run.
+
+    Returns:
+        The Kubernetes settings for the ZenML server.
+    """
+    return KubernetesOrchestratorSettings(
+        service_account_name="zenml-service-account",
+        pod_startup_timeout=600,
+        max_parallelism=max_parallelism,
+        pod_settings=KubernetesPodSettings(
+            resources={
+                "requests": {"cpu": "100m", "memory": "500Mi"},
+                # "limits": {"memory": "500Mi"}, -> grows linearly with number of steps
+            },
+            node_selectors={"pool": "workloads"},
+            tolerations=[
+                {
+                    "key": "pool",
+                    "operator": "Equal",
+                    "value": "workloads",
+                    "effect": "NoSchedule",
+                }
+            ],
+            env=[
+                {"name": "ZENML_LOGGING_VERBOSITY", "value": "debug"},
+                {"name": "ZENML_ENABLE_RICH_TRACEBACK", "value": "false"},
+            ],
+        ),
+        orchestrator_pod_settings=KubernetesPodSettings(
+            resources={
+                "requests": {"cpu": "100m", "memory": "500Mi"},
+                # "limits": {"memory": "500Mi"}, # -> grows linearly with number of steps
+            },
+            node_selectors={"pool": "workloads"},
+            tolerations=[
+                {
+                    "key": "pool",
+                    "operator": "Equal",
+                    "value": "workloads",
+                    "effect": "NoSchedule",
+                }
+            ],
+        ),
+    )
+

 docker_settings = DockerSettings(
     python_package_installer=PythonPackageInstaller.UV,
 )
-settings = {"docker": docker_settings, "orchestrator": kubernetes_settings}
+settings = {"docker": docker_settings}


 @step
@@ -243,6 +261,7 @@ def load_step(
 # The report results step is beefier than the load step because it has to fetch
 # all the artifacts from the run.
 report_kubernetes_settings = KubernetesOrchestratorSettings(
+    service_account_name="zenml-service-account",
     pod_settings=KubernetesPodSettings(
         resources={
             "requests": {"cpu": "100m", "memory": "800Mi"},
@@ -257,7 +276,10 @@ def load_step(
                 "effect": "NoSchedule",
             }
         ],
-        env=[{"name": "ZENML_LOGGING_VERBOSITY", "value": "debug"}],
+        env=[
+            {"name": "ZENML_LOGGING_VERBOSITY", "value": "debug"},
+            {"name": "ZENML_ENABLE_RICH_TRACEBACK", "value": "false"},
+        ],
     ),
 )

@@ -297,7 +319,7 @@ def report_results() -> None:
     print(f"Number of steps: {len(results)}")


-@pipeline(enable_cache=False, settings=settings)
+@pipeline(enable_cache=False)
 def load_test_pipeline(
     num_parallel_steps: int, duration: int, sleep_interval: float
 ) -> None:
@@ -360,8 +382,20 @@ def load_test_pipeline(
     type=int,
     show_default=True,
 )
+@click.option(
+    "--max-parallel-steps",
+    "-m",
+    help="Maximum number of parallel steps to run",
+    required=False,
+    default=None,
+    type=int,
+)
 def main(
-    parallel_steps: int, duration: int, sleep_interval: float, num_tags: int
+    parallel_steps: int,
+    duration: int,
+    sleep_interval: float,
+    num_tags: int,
+    max_parallel_steps: Optional[int] = None,
 ) -> None:
     """Execute a ZenML load test with configurable parallel steps.

@@ -373,12 +407,25 @@
         duration: The duration of the load test in seconds.
         sleep_interval: The interval to sleep between API calls in seconds.
         num_tags: The number of tags to add to the pipeline.
+        max_parallel_steps: The maximum number of parallel steps to run.
     """
-    click.echo(f"Starting load test with {parallel_steps} parallel steps...")
+    if max_parallel_steps:
+        click.echo(
+            f"Starting load test with {parallel_steps} parallel steps with "
+            f"max {max_parallel_steps} running steps at a time..."
+        )
+    else:
+        click.echo(
+            f"Starting load test with {parallel_steps} parallel steps..."
+        )
     click.echo(f"Duration: {duration}s, Sleep Interval: {sleep_interval}s")

+    kubernetes_settings = get_kubernetes_settings(max_parallel_steps)
+    settings["orchestrator"] = kubernetes_settings
+
     load_test_pipeline.configure(
         tags=[Tag(name=f"tag_{i}", cascade=True) for i in range(num_tags)],
+        settings=settings,
     )

     load_test_pipeline(