Commit 2e164a1

updates with json helper
Signed-off-by: Filinto Duran <[email protected]>
1 parent e837ccb commit 2e164a1

3 files changed: +303 −0 lines changed

dapr/aio/clients/grpc/client.py

Lines changed: 93 additions & 0 deletions

@@ -1853,6 +1853,99 @@ async def converse_stream_alpha1(
         except grpc.aio.AioRpcError as err:
             raise DaprGrpcError(err) from err
 
+    async def converse_stream_json(
+        self,
+        name: str,
+        inputs: List[ConversationInput],
+        *,
+        context_id: Optional[str] = None,
+        parameters: Optional[Dict[str, GrpcAny]] = None,
+        metadata: Optional[Dict[str, str]] = None,
+        scrub_pii: Optional[bool] = None,
+        temperature: Optional[float] = None,
+    ) -> AsyncIterator[Dict[str, Any]]:
+        """Invoke an LLM using the streaming conversation API with JSON response format (Alpha).
+
+        This method provides a JSON-formatted streaming interface that's compatible with
+        common LLM response formats, making it easier to integrate with existing tools
+        and frameworks that expect JSON responses.
+
+        Args:
+            name: Name of the LLM component to invoke
+            inputs: List of conversation inputs
+            context_id: Optional ID for continuing an existing chat
+            parameters: Optional custom parameters for the request
+            metadata: Optional metadata for the component
+            scrub_pii: Optional flag to scrub PII from inputs and outputs
+            temperature: Optional temperature setting for the LLM to optimize for
+                creativity or predictability
+
+        Yields:
+            Dict[str, Any]: JSON-formatted conversation response chunks with structure:
+                {
+                    "choices": [
+                        {
+                            "delta": {
+                                "content": "chunk content",
+                                "role": "assistant"
+                            },
+                            "index": 0,
+                            "finish_reason": None
+                        }
+                    ],
+                    "context_id": "optional context ID",
+                    "usage": {
+                        "prompt_tokens": 0,
+                        "completion_tokens": 0,
+                        "total_tokens": 0
+                    }
+                }
+
+        Raises:
+            DaprGrpcError: If the Dapr runtime returns an error
+        """
+        async for chunk in self.converse_stream_alpha1(
+            name=name,
+            inputs=inputs,
+            context_id=context_id,
+            parameters=parameters,
+            metadata=metadata,
+            scrub_pii=scrub_pii,
+            temperature=temperature,
+        ):
+            # Transform the chunk to JSON format compatible with common LLM APIs
+            chunk_dict = {
+                'choices': [],
+                'context_id': None,
+                'usage': None,
+            }
+
+            # Handle streaming result chunks
+            if chunk.result and chunk.result.result:
+                chunk_dict['choices'] = [
+                    {
+                        'delta': {
+                            'content': chunk.result.result,
+                            'role': 'assistant'
+                        },
+                        'index': 0,
+                        'finish_reason': None
+                    }
+                ]
+
+            # Handle context ID
+            if chunk.context_id:
+                chunk_dict['context_id'] = chunk.context_id
+
+            # Handle usage information (typically in the final chunk)
+            if chunk.usage:
+                chunk_dict['usage'] = {
+                    'prompt_tokens': chunk.usage.prompt_tokens,
+                    'completion_tokens': chunk.usage.completion_tokens,
+                    'total_tokens': chunk.usage.total_tokens,
+                }
+
+            yield chunk_dict
+
     async def wait(self, timeout_s: float):
         """Waits for sidecar to be available within the timeout.
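
For orientation, here is a minimal consumption sketch for the new async method, assuming a running sidecar and a conversation component named 'echo' (the same component name the example file below uses); it accumulates the streamed deltas into one reply, using only the API added in this diff:

import asyncio

from dapr.aio.clients import DaprClient
from dapr.clients.grpc._request import ConversationInput


async def collect_reply() -> str:
    async with DaprClient() as client:
        parts = []
        async for chunk in client.converse_stream_json(
            name='echo',  # assumed component name; adjust to your setup
            inputs=[ConversationInput(content='Hi!', role='user')],
        ):
            # Each chunk is a plain dict; pull content out of the delta, if any.
            for choice in chunk.get('choices', []):
                content = choice.get('delta', {}).get('content')
                if content:
                    parts.append(content)
        return ''.join(parts)


print(asyncio.run(collect_reply()))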

dapr/clients/grpc/client.py

Lines changed: 93 additions & 0 deletions

@@ -1855,6 +1855,99 @@ def converse_stream_alpha1(
         except RpcError as err:
             raise DaprGrpcError(err) from err
 
+    def converse_stream_json(
+        self,
+        name: str,
+        inputs: List[ConversationInput],
+        *,
+        context_id: Optional[str] = None,
+        parameters: Optional[Dict[str, GrpcAny]] = None,
+        metadata: Optional[Dict[str, str]] = None,
+        scrub_pii: Optional[bool] = None,
+        temperature: Optional[float] = None,
+    ) -> Iterator[Dict[str, Any]]:
+        """Invoke an LLM using the streaming conversation API with JSON response format (Alpha).
+
+        This method provides a JSON-formatted streaming interface that's compatible with
+        common LLM response formats, making it easier to integrate with existing tools
+        and frameworks that expect JSON responses.
+
+        Args:
+            name: Name of the LLM component to invoke
+            inputs: List of conversation inputs
+            context_id: Optional ID for continuing an existing chat
+            parameters: Optional custom parameters for the request
+            metadata: Optional metadata for the component
+            scrub_pii: Optional flag to scrub PII from inputs and outputs
+            temperature: Optional temperature setting for the LLM to optimize for
+                creativity or predictability
+
+        Yields:
+            Dict[str, Any]: JSON-formatted conversation response chunks with structure:
+                {
+                    "choices": [
+                        {
+                            "delta": {
+                                "content": "chunk content",
+                                "role": "assistant"
+                            },
+                            "index": 0,
+                            "finish_reason": None
+                        }
+                    ],
+                    "context_id": "optional context ID",
+                    "usage": {
+                        "prompt_tokens": 0,
+                        "completion_tokens": 0,
+                        "total_tokens": 0
+                    }
+                }
+
+        Raises:
+            DaprGrpcError: If the Dapr runtime returns an error
+        """
+        for chunk in self.converse_stream_alpha1(
+            name=name,
+            inputs=inputs,
+            context_id=context_id,
+            parameters=parameters,
+            metadata=metadata,
+            scrub_pii=scrub_pii,
+            temperature=temperature,
+        ):
+            # Transform the chunk to JSON format compatible with common LLM APIs
+            chunk_dict = {
+                'choices': [],
+                'context_id': None,
+                'usage': None,
+            }
+
+            # Handle streaming result chunks
+            if chunk.result and chunk.result.result:
+                chunk_dict['choices'] = [
+                    {
+                        'delta': {
+                            'content': chunk.result.result,
+                            'role': 'assistant'
+                        },
+                        'index': 0,
+                        'finish_reason': None
+                    }
+                ]
+
+            # Handle context ID
+            if chunk.context_id:
+                chunk_dict['context_id'] = chunk.context_id
+
+            # Handle usage information (typically in the final chunk)
+            if chunk.usage:
+                chunk_dict['usage'] = {
+                    'prompt_tokens': chunk.usage.prompt_tokens,
+                    'completion_tokens': chunk.usage.completion_tokens,
+                    'total_tokens': chunk.usage.total_tokens,
+                }
+
+            yield chunk_dict
+
     def wait(self, timeout_s: float):
         """Waits for sidecar to be available within the timeout.
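
Because each yielded chunk is a plain dict built from JSON-friendly types, it serializes directly. A small sketch relaying the sync stream as newline-delimited JSON (the 'echo' component name is again an assumption borrowed from the example below):

import json

from dapr.clients import DaprClient
from dapr.clients.grpc._request import ConversationInput

with DaprClient() as client:
    for chunk in client.converse_stream_json(
        name='echo',  # assumed component name
        inputs=[ConversationInput(content='Hi!', role='user')],
    ):
        # None serializes to null, so every chunk is valid JSON on its own line.
        print(json.dumps(chunk))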
Lines changed: 117 additions & 0 deletions

@@ -0,0 +1,117 @@
+#!/usr/bin/env python3
+
+"""
+Example demonstrating the new converse_stream_json API.
+
+This example shows how to use the new JSON-formatted streaming conversation API
+that provides responses compatible with common LLM response formats, making it
+easier to integrate with existing tools and frameworks.
+
+Prerequisites:
+- Dapr sidecar running with conversation components
+- Use tools/run_dapr_dev.py to start a development sidecar with echo component
+"""
+
+import asyncio
+
+from dapr.aio.clients import DaprClient as AsyncDaprClient
+from dapr.clients import DaprClient
+from dapr.clients.grpc._request import ConversationInput
+
+
+def sync_json_streaming_example():
+    """Demonstrate synchronous JSON streaming conversation."""
+    print('🚀 Testing synchronous JSON streaming conversation...')
+
+    with DaprClient() as d:
+        print('✓ Connected to Dapr sidecar')
+
+        inputs = [ConversationInput(content='Hello from JSON streaming test!', role='user')]
+
+        print('\n📡 Streaming with JSON format...')
+        for chunk in d.converse_stream_json(
+            name='echo', inputs=inputs, context_id='json-test-session'
+        ):
+            print(f'📦 JSON chunk: {chunk}')
+
+            # Extract content from the JSON structure
+            choices = chunk.get('choices', [])
+            if choices and choices[0].get('delta', {}).get('content'):
+                content = choices[0]['delta']['content']
+                print(f'   Content: "{content}"')
+
+            # Check for context ID
+            if chunk.get('context_id'):
+                print(f'   Context ID: {chunk["context_id"]}')
+
+            # Check for usage information
+            if chunk.get('usage'):
+                usage = chunk['usage']
+                prompt_tokens = usage['prompt_tokens']
+                completion_tokens = usage['completion_tokens']
+                total_tokens = usage['total_tokens']
+                print(f'   Usage: {prompt_tokens} + {completion_tokens} = {total_tokens} tokens')
+
+
+async def async_json_streaming_example():
+    """Demonstrate asynchronous JSON streaming conversation."""
+    print('\n🧪 Testing asynchronous JSON streaming conversation...')
+
+    async with AsyncDaprClient() as d:
+        print('✓ Connected to Dapr sidecar (async)')
+
+        inputs = [ConversationInput(content='Hello from async JSON streaming test!', role='user')]
+
+        print('\n📡 Async streaming with JSON format...')
+        async for chunk in d.converse_stream_json(
+            name='echo', inputs=inputs, context_id='async-json-test-session'
+        ):
+            print(f'📦 Async JSON chunk: {chunk}')
+
+            # Extract content from the JSON structure
+            choices = chunk.get('choices', [])
+            if choices and choices[0].get('delta', {}).get('content'):
+                content = choices[0]['delta']['content']
+                print(f'   Async Content: "{content}"')
+
+            # Check for context ID
+            if chunk.get('context_id'):
+                print(f'   Async Context ID: {chunk["context_id"]}')
+
+            # Check for usage information
+            if chunk.get('usage'):
+                usage = chunk['usage']
+                prompt_tokens = usage['prompt_tokens']
+                completion_tokens = usage['completion_tokens']
+                total_tokens = usage['total_tokens']
+                usage_parts = [
+                    f'   Async Usage: {prompt_tokens}',
+                    f'{completion_tokens}',
+                    f'{total_tokens} tokens',
+                ]
+                print(' + '.join(usage_parts[:2]) + ' = ' + usage_parts[2])
+
+
+def main():
+    """Run both sync and async examples."""
+    try:
+        # Run synchronous example
+        sync_json_streaming_example()
+
+        # Run asynchronous example
+        asyncio.run(async_json_streaming_example())
+
+        print('\n✅ JSON streaming examples completed successfully!')
+        json_compat_msg = '\n💡 The JSON format is compatible with common LLM APIs like OpenAI.'
+        integration_msg = '   This makes it easier to integrate with existing tools and frameworks.'
+        print(json_compat_msg)
+        print(integration_msg)
+
+    except Exception as e:
+        print(f'❌ Error: {e}')
+        print('\n💡 Make sure to start the Dapr sidecar with:')
+        print('   python tools/run_dapr_dev.py')
+
+
+if __name__ == '__main__':
+    main()
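
Design note: the per-chunk shape (choices → delta → content/role, plus an optional usage block) mirrors the chunk layout of common chat-completion streaming APIs, which is what lets JSON-oriented tooling consume this stream with little or no adaptation, as the example above demonstrates.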
