feat: add llm observability to python sdk

k11kirky · k11kirky · commit cde65a7de715 · 2025-01-09T14:53:14.000-08:00
diff --git a/llm_observability_example.py b/llm_observability_example.py
@@ -0,0 +1,46 @@
+import os
+import uuid
+
+import posthog
+from posthog.ai import OpenAI
+
+# Example credentials: each value is read from the environment, falling back to a placeholder.
+posthog.project_api_key = os.getenv("POSTHOG_PROJECT_API_KEY", "your-project-api-key")
+posthog.personal_api_key = os.getenv("POSTHOG_PERSONAL_API_KEY", "your-personal-api-key")
+posthog.host = os.getenv("POSTHOG_HOST", "http://localhost:8000")  # Or https://app.posthog.com
+posthog.debug = True
+
+openai_client = OpenAI(
+    api_key=os.getenv("OPENAI_API_KEY", "your-openai-api-key"),  # forwarded to openai.OpenAI
+    posthog_client=posthog,  # the posthog module itself is used as the capture client
+)
+
+def main():
+    """Run one non-streaming chat completion and print the reply or the error."""
+    trace_id = str(uuid.uuid4())
+    print("Trace ID:", trace_id)
+    prompt = [
+        {"role": "system", "content": "You are a complex problem solver."},
+        {"role": "user", "content": "Explain quantum computing in simple terms."},
+    ]
+    try:
+        print("Calling OpenAI")
+        response = openai_client.chat.completions.create(
+            model="gpt-4o-mini",
+            messages=prompt,
+            max_tokens=100,
+            temperature=0.7,
+            posthog_distinct_id="user_12345",
+            posthog_trace_id=trace_id,
+            posthog_properties={"example_key": "example_value"},
+        )
+        print("RESPONSE:", response)
+        if not (response and response.choices):
+            print("No response or unexpected format returned.")
+        else:
+            print("OpenAI response:", response.choices[0].message.content)
+    except Exception as exc:
+        print("Error during OpenAI call:", str(exc))
+
+if __name__ == "__main__":
+    main()
diff --git a/llm_observability_stream_example.py b/llm_observability_stream_example.py
@@ -0,0 +1,43 @@
+import os
+import uuid
+
+import posthog
+from posthog.ai import OpenAI
+
+# Example credentials: each value is read from the environment, falling back to a placeholder.
+posthog.project_api_key = os.getenv("POSTHOG_PROJECT_API_KEY", "your-project-api-key")
+posthog.personal_api_key = os.getenv("POSTHOG_PERSONAL_API_KEY", "your-personal-api-key")
+posthog.host = os.getenv("POSTHOG_HOST", "http://localhost:8000")  # Or https://app.posthog.com
+posthog.debug = True
+
+openai_client = OpenAI(
+    api_key=os.getenv("OPENAI_API_KEY", "your-openai-api-key"),  # forwarded to openai.OpenAI
+    posthog_client=posthog,  # the posthog module itself is used as the capture client
+)
+
+def main():
+    """Stream one chat completion to stdout, skipping chunks that carry no choices."""
+    trace_id = str(uuid.uuid4())
+    print("Trace ID:", trace_id)
+    try:
+        print("Calling OpenAI")
+        stream = openai_client.chat.completions.create(
+            model="gpt-4o-mini",
+            messages=[
+                {"role": "system", "content": "You are a complex problem solver."},
+                {"role": "user", "content": "Explain quantum computing in simple terms."},
+            ],
+            max_tokens=1000,
+            temperature=0.7,
+            posthog_distinct_id="user_12345",
+            posthog_trace_id=trace_id,
+            posthog_properties={"example_key": "example_value"},
+            stream=True,
+        )
+        for chunk in stream:
+            print((chunk.choices[0].delta.content or "") if chunk.choices else "", end="")
+    except Exception as e:
+        print("Error during OpenAI call:", str(e))
+
+if __name__ == "__main__":
+    main()
diff --git a/posthog/ai/__init__.py b/posthog/ai/__init__.py
@@ -0,0 +1,3 @@
+from .openai import OpenAI
+
+__all__ = ["OpenAI"]
diff --git a/posthog/ai/openai.py b/posthog/ai/openai.py
@@ -0,0 +1,147 @@
+import time
+from typing import Any, Dict, Optional, Union
+
+import openai
+from posthog.client import Client as PostHogClient
+
+
+def get_model_params(kwargs: Dict[str, Any]) -> Dict[str, Any]:
+    """
+    Return the subset of ``kwargs`` that are recognised model parameters.
+
+    Only keys actually present in ``kwargs`` are copied; values are not altered.
+    """
+    # The order of this tuple fixes the key order of the returned dict.
+    tracked = ("temperature", "max_tokens", "top_p", "frequency_penalty",
+               "presence_penalty", "n", "stop", "stream")
+    return {name: kwargs[name] for name in tracked if name in kwargs}
+
+def get_output(response: openai.types.chat.ChatCompletion) -> Dict[str, Any]:
+    """Collect the role and text of every choice that carries message content.
+
+    Choices whose ``message.content`` is falsy (None or "") are skipped.
+    """
+    messages = (choice.message for choice in response.choices)
+    return {
+        "choices": [
+            {"content": msg.content, "role": msg.role} for msg in messages if msg.content
+        ]
+    }
+
+
+class OpenAI:
+    """
+    Drop-in wrapper over ``openai.OpenAI`` whose chat completions report usage to PostHog.
+    """
+
+    def __init__(
+        self,
+        posthog_client: PostHogClient,
+        **openai_config: Any,
+    ):
+        """
+        Args:
+            posthog_client: Client used to capture the ``$ai_generation`` events.
+            **openai_config: Keyword args forwarded unchanged to ``openai.OpenAI``
+                (e.g. api_key="sk-...", organization="xxx").
+        """
+        self._posthog_client = posthog_client
+        # A dedicated client instance is built, so no global openai config is touched.
+        self._openai_client = openai.OpenAI(**openai_config)
+
+    @property
+    def chat(self) -> "ChatNamespace":
+        """Return a new ``ChatNamespace`` bound to both clients (built on each access)."""
+        return ChatNamespace(self._posthog_client, self._openai_client)
+
+
+class ChatNamespace:
+    """Holds both clients and exposes ``completions``, like the SDK's ``chat`` attribute."""
+    def __init__(self, posthog_client: Union[PostHogClient, Any], openai_client: Any):
+        self._ph_client, self._openai_client = posthog_client, openai_client
+
+    @property
+    def completions(self):
+        return ChatCompletions(self._ph_client, self._openai_client)
+
+
+class ChatCompletions:
+    """Proxy for ``chat.completions`` that records each ``create`` call in PostHog."""
+    def __init__(self, posthog_client: Union[PostHogClient, Any], openai_client: Any):
+        self._ph_client = posthog_client
+        self._openai_client = openai_client
+
+    def create(
+        self,
+        posthog_distinct_id: Optional[str] = None,
+        posthog_trace_id: Optional[str] = None,
+        posthog_properties: Optional[Dict[str, Any]] = None,
+        **kwargs: Any,
+    ):
+        """
+        Wraps open ai chat completions and captures a $ai_generation event in PostHog.
+
+        PostHog-specific parameters:
+            posthog_distinct_id: Ties the resulting event to a user in PostHog;
+                "anonymous_ai_user" is used when omitted.
+            posthog_trace_id: For grouping multiple calls into a single trace.
+            posthog_properties: Additional custom properties to include on the PostHog
+                event; on a key clash they override the built-in ``$ai_*`` values.
+            **kwargs: Forwarded unchanged to ``chat.completions.create``.
+
+        Returns:
+            Whatever the underlying OpenAI call returns (a stream when ``stream=True``).
+
+        Raises:
+            Exception: Any error raised by the OpenAI call, re-raised after the event
+                (with ``$ai_http_status`` taken from the error, or 500) is captured.
+        """
+        # perf_counter is monotonic, so latency cannot go negative on clock changes.
+        start_time = time.perf_counter()
+        response = error = None
+        http_status = 200
+        # Only Exception is recorded; BaseException (e.g. KeyboardInterrupt) sends no event.
+        try:
+            response = self._openai_client.chat.completions.create(**kwargs)
+        except Exception as exc:
+            error = exc
+            http_status = getattr(exc, "status_code", 500)
+        latency = time.perf_counter() - start_time
+
+        # ``usage`` may be None on a completion and is absent on streams: treat as empty.
+        usage_obj = getattr(response, "usage", None)
+        usage: Dict[str, Any] = usage_obj.model_dump() if usage_obj is not None else {}
+
+        # Build PostHog event properties
+        event_properties = {
+            "$ai_provider": "openai",
+            "$ai_model": kwargs.get("model"),
+            "$ai_model_parameters": get_model_params(kwargs),
+            "$ai_input": kwargs.get("messages"),
+            "$ai_output": None,
+            "$ai_http_status": http_status,
+            "$ai_input_tokens": usage.get("prompt_tokens", 0),
+            "$ai_output_tokens": usage.get("completion_tokens", 0),
+            "$ai_latency": latency,
+            "$ai_trace_id": posthog_trace_id,
+        }
+
+        # TODO: we need to support streaming responses
+        if response is not None and error is None and not kwargs.get("stream", False):
+            event_properties["$ai_output"] = get_output(response)
+
+        # Merge in any custom PostHog properties
+        if posthog_properties:
+            event_properties.update(posthog_properties)
+
+        if callable(getattr(self._ph_client, "capture", None)):
+            self._ph_client.capture(
+                distinct_id=posthog_distinct_id or "anonymous_ai_user",
+                event="$ai_generation",
+                properties=event_properties,
+            )
+
+        if error is not None:
+            raise error
+
+        return response
diff --git a/setup.py b/setup.py
@@ -14,7 +14,7 @@
 PostHog is developer-friendly, self-hosted product analytics. posthog-python is the python package.
 """
 
-install_requires = ["requests>=2.7,<3.0", "six>=1.5", "monotonic>=1.5", "backoff>=1.10.0", "python-dateutil>2.1"]
+install_requires = ["requests>=2.7,<3.0", "six>=1.5", "monotonic>=1.5", "backoff>=1.10.0", "python-dateutil>2.1", "openai>=1.59.5"]
 
 extras_require = {
     "dev": [

Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,3 @@`
	`1`	`+from .openai import OpenAI`
	`2`	`+`
	`3`	`+__all__ = ["OpenAI"]`