From a76d14cd03da768b3511934ecfb685d19f71b308 Mon Sep 17 00:00:00 2001
From: Frank Deng
Date: Thu, 4 Sep 2025 19:05:34 -0700
Subject: [PATCH 1/3] Add phoenix filter pipeline

---
 examples/filters/phoenix_pipeline.py | 110 +++++++++++++++++++++++++++
 1 file changed, 110 insertions(+)
 create mode 100644 examples/filters/phoenix_pipeline.py

diff --git a/examples/filters/phoenix_pipeline.py b/examples/filters/phoenix_pipeline.py
new file mode 100644
index 00000000..8d11a9d4
--- /dev/null
+++ b/examples/filters/phoenix_pipeline.py
@@ -0,0 +1,110 @@
+"""
+title: Phoenix Filter Pipeline
+author: jia.deng@cloudkitchens.com
+date: 2025-09-04
+version: 1.0
+license: MIT
+description: A pipeline for Phoenix integration
+requirements: arize-phoenix-otel
+"""
+
+from typing import List, Optional
+from pydantic import BaseModel
+import os
+
+import phoenix.otel
+
+class Pipeline:
+    class Valves(BaseModel):
+        # List target pipeline ids (models) that this filter will be connected to.
+        # If you want to connect this filter to all pipelines, you can set pipelines to ["*"]
+        # e.g. ["llama3:latest", "gpt-3.5-turbo"]
+        pipelines: List[str] = []
+
+        # Assign a priority level to the filter pipeline.
+        # The priority level determines the order in which the filter pipelines are executed.
+        # The lower the number, the higher the priority.
+        priority: int = 0
+
+    def __init__(self):
+        # Pipeline filters are only compatible with Open WebUI
+        # You can think of a filter pipeline as middleware that can be used to edit the form data before it is sent to the OpenAI API.
+        self.type = "filter"
+
+        # Optionally, you can set the id and name of the pipeline.
+        # Best practice is not to specify the id so that it can be automatically inferred from the filename, allowing users to install multiple versions of the same pipeline.
+        # The identifier must be unique across all pipelines.
+        # The identifier must be an alphanumeric string that can include underscores or hyphens. It cannot contain spaces, special characters, slashes, or backslashes.
+        # self.id = "phoenix_filter_pipeline"
+        self.name = "Phoenix Filter"
+
+        # Initialize
+        self.valves = self.Valves(
+            **{
+                "pipelines": ["*"],  # Connect to all pipelines
+            }
+        )
+
+        self.tracer = None
+
+    async def on_startup(self):
+        # This function is called when the server is started.
+        print(f"on_startup: {__name__}")
+        self._set_tracer()
+
+    async def on_shutdown(self):
+        # This function is called when the server is stopped.
+        print(f"on_shutdown: {__name__}")
+
+    async def on_valves_updated(self):
+        # This function is called when the valves are updated.
+        print(f"on_valves_updated: {__name__}")
+        # reset tracer
+        self._set_tracer()
+
+    async def inlet(self, body: dict, user: Optional[dict] = None) -> dict:
+        # This filter is applied to the form data before it is sent to the OpenAI API.
+        print(f"inlet: {__name__}")
+
+        if self.tracer is None:
+            print("[WARNING] tracer is not initialized")
+            return body
+
+        print(f"Inlet function called with body: {body} and user: {user}")
+
+        user_message = body["messages"][-1]["content"]
+        with self.tracer.start_as_current_span("inlet") as span:
+            span.set_attribute("user.id", user.get("id", "unknown") if user else "unknown")
+            span.set_attribute("user_message.length", len(user_message))
+            span.set_attribute("user_message.content", user_message[:100])
+
+        return body
+
+    async def outlet(self, body: dict, user: Optional[dict] = None) -> dict:
+        print(f"outlet: {__name__}")
+
+        if self.tracer is None:
+            print("[WARNING] tracer is not initialized")
+            return body
+
+        print(f"Outlet function called with body: {body} and user: {user}")
+
+        with self.tracer.start_as_current_span("outlet") as span:
+            span.set_attribute("user.id", user.get("id", "unknown") if user else "unknown")
+
+        return body
+
+    def _set_tracer(self) -> None:
+
+        tracer_provider = phoenix.otel.register(
+            project_name=os.getenv("PHOENIX_PROJECT_NAME", "open-webui-pipelines"),
+            endpoint=os.getenv(
+                "PHOENIX_ENDPOINT",
+                "http://phoenix.phoenix.svc.cluster.local/v1/traces",
+            ),
+            auto_instrument=True,
+            set_global_tracer_provider=False,
+            batch=True,
+        )
+
+        self.tracer = tracer_provider.get_tracer(__name__)
\ No newline at end of file

From 9c026dc9540c7b28a2b8dc8d848f9687bda6aebb Mon Sep 17 00:00:00 2001
From: Frank Deng
Date: Wed, 10 Sep 2025 13:43:24 -0700
Subject: [PATCH 2/3] Implementation

---
 examples/filters/phoenix_pipeline.py | 355 ++++++++++++++++++++++++---
 1 file changed, 315 insertions(+), 40 deletions(-)

diff --git a/examples/filters/phoenix_pipeline.py b/examples/filters/phoenix_pipeline.py
index 8d11a9d4..6b764db1 100644
--- a/examples/filters/phoenix_pipeline.py
+++ b/examples/filters/phoenix_pipeline.py
@@ -1,96 +1,371 @@
 """
 title: Phoenix Filter Pipeline
 author: jia.deng@cloudkitchens.com
-date: 2025-09-04
+date: 2025-09-09
 version: 1.0
 license: MIT
 description: A pipeline for Phoenix integration
 requirements: arize-phoenix-otel
 """
 
-from typing import List, Optional
-from pydantic import BaseModel
+import logging
+import json
 import os
+from collections.abc import Iterator
+from typing import Any
+
+from pydantic import BaseModel
 
 import phoenix.otel
+from openinference.instrumentation import using_attributes, OITracer
+from openinference.semconv.trace import (
+    MessageAttributes,
+    OpenInferenceMimeTypeValues,
+    OpenInferenceSpanKindValues,
+    SpanAttributes,
+)
+from opentelemetry.trace import use_span, Span
+
+logger = logging.getLogger(__name__)
+logging.basicConfig(
+    level=logging.INFO,
+    format="%(asctime)s %(levelname)s [%(filename)s:%(lineno)d] %(message)s",
+    datefmt="%Y-%m-%d %H:%M:%S",
+)
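+
+# The helper functions below translate Open WebUI request/response payloads
+# into OpenInference span attributes (flat key/value pairs that Phoenix
+# renders on traces); each helper yields (attribute_key, attribute_value)
+# pairs that are consumed in inlet/outlet.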
+
+
+def _llm_span_kind_attributes() -> Iterator[tuple[str, str]]:
+    """
+    Yields the OpenInference span kind attribute for LLMs.
+    """
+    yield SpanAttributes.OPENINFERENCE_SPAN_KIND, OpenInferenceSpanKindValues.LLM.value
+
+
+def _llm_model_name_attributes(model_name: str) -> Iterator[tuple[str, str]]:
+    """
+    Yields the OpenInference model name attribute.
+    """
+    yield SpanAttributes.LLM_MODEL_NAME, model_name
+
+
+def _input_attributes(payload: Any) -> Iterator[tuple[str, str]]:
+    """
+    Yields the OpenInference input value attribute as a JSON string if the
+    payload can be serialized as JSON, otherwise as a string.
+    """
+    try:
+        yield SpanAttributes.INPUT_VALUE, json.dumps(payload)
+        yield SpanAttributes.INPUT_MIME_TYPE, OpenInferenceMimeTypeValues.JSON.value
+    except TypeError:
+        yield SpanAttributes.INPUT_VALUE, str(payload)
+        yield SpanAttributes.INPUT_MIME_TYPE, OpenInferenceMimeTypeValues.TEXT.value
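+        # Note: json.dumps raises TypeError for payloads that are not JSON
+        # serializable (json.JSONDecodeError only applies to parsing), so
+        # TypeError is the exception handled here, mirroring _output_attributes.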
+ """ + try: + yield SpanAttributes.INPUT_VALUE, json.dumps(payload) + yield SpanAttributes.INPUT_MIME_TYPE, OpenInferenceMimeTypeValues.JSON.value + except json.JSONDecodeError: + yield SpanAttributes.INPUT_VALUE, str(payload) + yield SpanAttributes.INPUT_MIME_TYPE, OpenInferenceMimeTypeValues.TEXT.value + + +def _llm_input_messages_attributes( + messages: list[dict[str, Any]], +) -> Iterator[tuple[str, str]]: + """ + Yields the OpenInference input messages attributes for each message in the list. + """ + for messages_index, message in enumerate(messages): + yield ( + f"{SpanAttributes.LLM_INPUT_MESSAGES}.{messages_index}." + f"{MessageAttributes.MESSAGE_ROLE}", + message.get("role", ""), + ) + yield ( + f"{SpanAttributes.LLM_INPUT_MESSAGES}.{messages_index}." + f"{MessageAttributes.MESSAGE_CONTENT}", + message.get("content", ""), + ) + +def _metadata_attributes(metadata: dict[str, Any]) -> Iterator[tuple[str, str]]: + """ + Yields the OpenInference metadata attributes. + """ + + def flatten(prefix: str, value: Any) -> Iterator[tuple[str, str]]: + if isinstance(value, dict): + for k, v in value.items(): + yield from flatten(f"{prefix}.{k}", v) + elif isinstance(value, list): + for i, v in enumerate(value): + yield from flatten(f"{prefix}.{i}", v) + else: + yield prefix, str(value) + + for key, value in metadata.items(): + yield from flatten(f"{SpanAttributes.METADATA}.{key}", value) + + +def _output_attributes(payload: Any) -> Iterator[tuple[str, str]]: + """ + Yields the OpenInference output value attribute as a JSON string if the + payload can be serialized as JSON, otherwise as a string. + """ + try: + yield SpanAttributes.OUTPUT_VALUE, json.dumps(payload) + yield SpanAttributes.OUTPUT_MIME_TYPE, OpenInferenceMimeTypeValues.JSON.value + except TypeError: + yield SpanAttributes.OUTPUT_VALUE, str(payload) + yield SpanAttributes.OUTPUT_MIME_TYPE, OpenInferenceMimeTypeValues.TEXT.value + + +def _llm_output_message_attributes( + message: dict[str, Any] +) -> Iterator[tuple[str, str]]: + """ + Yields the OpenInference output message attributes. + """ + yield ( + f"{SpanAttributes.LLM_OUTPUT_MESSAGES}.0.{MessageAttributes.MESSAGE_ROLE}", + message.get("role", ""), + ) + yield ( + f"{SpanAttributes.LLM_OUTPUT_MESSAGES}.0.{MessageAttributes.MESSAGE_CONTENT}", + message.get("content", ""), + ) + + +# pylint: disable=too-few-public-methods,disable=missing-function-docstring class Pipeline: + """A filter pipeline for Phoenix integration.""" + class Valves(BaseModel): + """Valve settings for the Phoenix filter pipeline.""" + # List target pipeline ids (models) that this filter will be connected to. # If you want to connect this filter to all pipelines, you can set pipelines to ["*"] # e.g. ["llama3:latest", "gpt-3.5-turbo"] - pipelines: List[str] = [] + pipelines: list[str] = [] # Assign a priority level to the filter pipeline. # The priority level determines the order in which the filter pipelines are executed. # The lower the number, the higher the priority. priority: int = 0 - def __init__(self): + # Add your custom parameters here + debug: bool = False + + def __init__(self) -> None: # Pipeline filters are only compatible with Open WebUI - # You can think of filter pipeline as a middleware that can be used to edit the form data before it is sent to the OpenAI API. + # You can think of filter pipeline as a middleware that can be used to + # edit the form data before it is sent to the OpenAI API. self.type = "filter" # Optionally, you can set the id and name of the pipeline. 
+
+def _metadata_attributes(metadata: dict[str, Any]) -> Iterator[tuple[str, str]]:
+    """
+    Yields the OpenInference metadata attributes.
+    """
+
+    def flatten(prefix: str, value: Any) -> Iterator[tuple[str, str]]:
+        if isinstance(value, dict):
+            for k, v in value.items():
+                yield from flatten(f"{prefix}.{k}", v)
+        elif isinstance(value, list):
+            for i, v in enumerate(value):
+                yield from flatten(f"{prefix}.{i}", v)
+        else:
+            yield prefix, str(value)
+
+    for key, value in metadata.items():
+        yield from flatten(f"{SpanAttributes.METADATA}.{key}", value)
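+# For example, metadata={"model": {"id": "llama3"}} should yield
+# "metadata.model.id" -> "llama3", assuming SpanAttributes.METADATA resolves
+# to the "metadata" prefix; list items are flattened with numeric indices.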
- print(f"inlet: {__name__}") - - if self.tracer is None: - print("[WARNING] tracer is initialized") + if self._tracer is None: + logger.warning("tracer is not initialized") return body - print(f"Inlet function called with body: {body} and user: {user}") + if self._debug: + logger.info( + "%s inlet function called with body: %s and user: %s", + __name__, + body, + user, + ) - user_message = body["messages"][-1]["content"] - with self.tracer.start_as_current_span("inlet") as span: - span.set_attribute("user.id", user.get("id", "unknown") if user else "unknown") - span.set_attribute("user_message.length", len(user_message)) - span.set_attribute("user_message.content", user_message[:100]) + required_keys = ["model", "messages", "metadata"] + missing_keys = [key for key in required_keys if key not in body] + if missing_keys: + error_message = f"Error: Missing keys in the request body: {missing_keys}" + raise ValueError(error_message) - return body + metadata = body.get("metadata") + if metadata is None: + raise ValueError("Error: Missing metadata in the request body") + + message_id = metadata.get("message_id") + if message_id is None: + raise ValueError("Error: Missing message_id in metadata") + + chat_id = metadata.get("chat_id") + # Handle temporary chats + if chat_id is None or chat_id == "local": + session_id = metadata.get("session_id") + chat_id = f"temporary-session-{session_id}" + metadata["chat_id"] = chat_id + body["metadata"] = metadata + + # task type + task = metadata.get("task", "response_generation") + + # model + model_info = metadata.get("model", {}) + model_id = body.get("model", model_info.get("id", "unknown")) + + messages = body.get("messages", []) + + # Inject system message from metadata if present, avoid duplicates + if task == "response_generation": + system_content = model_info.get("info", {}).get("params", {}).get("system") + if system_content: + # Remove all existing system messages + messages = [m for m in messages if m.get("role") != "system"] + system_message = { + "role": "system", + "content": system_content, + } + messages = [system_message] + messages + + openai_payload = { + "model": model_id, + "messages": messages, + } + + # TODO: follow_up_generation, title_generation, tags_generation tasks + # are missing outlet, so we end the span here for now + end_on_exit = task != "response_generation" + + with using_attributes( + session_id=chat_id, + user_id=user.get("name", "unknown") if user else "unknown", + ): + + if message_id in self._spans[task]: + span = self._spans[task][message_id] + else: + span = self._tracer.start_span(name=task) + self._spans[task][message_id] = span - async def outlet(self, body: dict, user: Optional[dict] = None) -> dict: - print(f"outlet: {__name__}") + with use_span(span, end_on_exit=end_on_exit): + for attribute_key, attribute_value in ( + *_metadata_attributes(metadata), + *_input_attributes(openai_payload), + *_llm_span_kind_attributes(), + *_llm_model_name_attributes(model_id), + *_llm_input_messages_attributes(messages), + ): + span.set_attribute(attribute_key, attribute_value) - if self.tracer is None: - print("[WARNING] tracer is initialized") + if end_on_exit: + self._spans[task].pop(message_id, None) + + return body + + # pylint: disable=too-many-locals + async def outlet( + self, body: dict[str, Any], user: dict[str, Any] | None = None + ) -> dict[str, Any]: + if self._tracer is None: + logger.warning("tracer is not initialized") return body - print(f"Outlet function called with body: {body} and user: {user}") + if 
+        with using_attributes(
+            session_id=chat_id,
+            user_id=user.get("name", "unknown") if user else "unknown",
+        ):
+
+            if message_id in self._spans[task]:
+                span = self._spans[task][message_id]
+            else:
+                span = self._tracer.start_span(name=task)
+                self._spans[task][message_id] = span
+
+            with use_span(span, end_on_exit=True):
+                for attribute_key, attribute_value in (
+                    *_llm_span_kind_attributes(),
+                    *_output_attributes(body),
+                    *_llm_output_message_attributes(assistant_message),
+                ):
+                    span.set_attribute(attribute_key, attribute_value)
 
-        with self.tracer.start_as_current_span("outlet") as span:
-            span.set_attribute("user.id", user.get("id", "unknown") if user else "unknown")
+        self._spans[task].pop(message_id, None)
 
         return body
 
@@ -107,4 +382,4 @@ def _set_tracer(self) -> None:
             batch=True,
         )
 
-        self.tracer = tracer_provider.get_tracer(__name__)
\ No newline at end of file
+        self._tracer = tracer_provider.get_tracer(__name__)

From db8192372c01c6301f630e2d3f04d123c7e59494 Mon Sep 17 00:00:00 2001
From: Frank Deng
Date: Wed, 10 Sep 2025 13:49:14 -0700
Subject: [PATCH 3/3] Update author name/email

---
 examples/filters/phoenix_pipeline.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/examples/filters/phoenix_pipeline.py b/examples/filters/phoenix_pipeline.py
index 6b764db1..bdea77c5 100644
--- a/examples/filters/phoenix_pipeline.py
+++ b/examples/filters/phoenix_pipeline.py
@@ -1,6 +1,6 @@
 """
 title: Phoenix Filter Pipeline
-author: jia.deng@cloudkitchens.com
+author: Frank Deng
 date: 2025-09-09
 version: 1.0
 license: MIT