From c0d6445af721d2c4f08d51ed5342cfc2288a4fd1 Mon Sep 17 00:00:00 2001
From: yaron2
Date: Fri, 21 Feb 2025 08:38:55 -0800
Subject: [PATCH 1/4] add dapr conversation api as llm inference

Signed-off-by: yaron2
---
 dapr_agents/llm/__init__.py      |   3 +-
 dapr_agents/llm/dapr/__init__.py |   2 +
 dapr_agents/llm/dapr/chat.py     | 122 +++++++++++++++++++++++++++++++
 dapr_agents/llm/dapr/client.py   |  87 ++++++++++++++++++++++
 dapr_agents/types/llm.py         |   8 ++
 5 files changed, 221 insertions(+), 1 deletion(-)
 create mode 100644 dapr_agents/llm/dapr/__init__.py
 create mode 100644 dapr_agents/llm/dapr/chat.py
 create mode 100644 dapr_agents/llm/dapr/client.py

diff --git a/dapr_agents/llm/__init__.py b/dapr_agents/llm/__init__.py
index 1f7613c0..90a3060b 100644
--- a/dapr_agents/llm/__init__.py
+++ b/dapr_agents/llm/__init__.py
@@ -9,4 +9,5 @@
 from .nvidia.client import NVIDIAClientBase
 from .nvidia.chat import NVIDIAChatClient
 from .nvidia.embeddings import NVIDIAEmbeddingClient
-from .elevenlabs import ElevenLabsSpeechClient
\ No newline at end of file
+from .elevenlabs import ElevenLabsSpeechClient
+from .dapr import DaprChatClient
\ No newline at end of file

diff --git a/dapr_agents/llm/dapr/__init__.py b/dapr_agents/llm/dapr/__init__.py
new file mode 100644
index 00000000..40b69cd1
--- /dev/null
+++ b/dapr_agents/llm/dapr/__init__.py
@@ -0,0 +1,2 @@
+from .chat import DaprChatClient
+from .client import DaprInferenceClientBase
\ No newline at end of file

diff --git a/dapr_agents/llm/dapr/chat.py b/dapr_agents/llm/dapr/chat.py
new file mode 100644
index 00000000..8bdbdcca
--- /dev/null
+++ b/dapr_agents/llm/dapr/chat.py
@@ -0,0 +1,122 @@
+from dapr_agents.llm.dapr.client import DaprInferenceClientBase
+from dapr_agents.llm.utils import RequestHandler, ResponseHandler
+from dapr_agents.prompt.prompty import Prompty
+from dapr_agents.types.message import BaseMessage
+from dapr_agents.llm.chat import ChatClientBase
+from dapr_agents.tool import AgentTool
+from typing import Union, Optional, Iterable, Dict, Any, List, Iterator, Type
+from pydantic import BaseModel
+from pathlib import Path
+import logging
+import os
+
+logger = logging.getLogger(__name__)
+
+class DaprChatClient(DaprInferenceClientBase, ChatClientBase):
+    """
+    Concrete class for chat completion via Dapr's Conversation API.
+    This class extends the ChatClientBase.
+    """
+
+    def model_post_init(self, __context: Any) -> None:
+        """
+        Initializes private attributes for provider, api, config, and client after validation.
+        """
+        # Set the private provider and api attributes
+        self._api = "chat"
+        self._llm_component = os.environ['DAPR_LLM_COMPONENT_DEFAULT']
+
+        return super().model_post_init(__context)
+
+    @classmethod
+    def from_prompty(cls, prompty_source: Union[str, Path], timeout: Union[int, float, Dict[str, Any]] = 1500) -> 'DaprChatClient':
+        """
+        Initializes a DaprChatClient using a Prompty source, which can be a file path or inline content.
+
+        Args:
+            prompty_source (Union[str, Path]): The source of the Prompty file, which can be a path to a file
+                or inline Prompty content as a string.
+            timeout (Union[int, float, Dict[str, Any]], optional): Timeout for requests, defaults to 1500 seconds.
+
+        Returns:
+            DaprChatClient: An instance of DaprChatClient configured with the model settings from the Prompty source.
+ """ + # Load the Prompty instance from the provided source + prompty_instance = Prompty.load(prompty_source) + + # Generate the prompt template from the Prompty instance + prompt_template = Prompty.to_prompt_template(prompty_instance) + + # Extract the model configuration from Prompty + model_config = prompty_instance.model + + # Initialize the DaprChatClient based on the Prompty model configuration + return cls.model_validate({ + 'timeout': timeout, + 'prompty': prompty_instance, + 'prompt_template': prompt_template, + }) + + def generate( + self, + messages: Union[str, Dict[str, Any], BaseMessage, Iterable[Union[Dict[str, Any], BaseMessage]]] = None, + input_data: Optional[Dict[str, Any]] = None, + llm_component: Optional[str] = None, + tools: Optional[List[Union[AgentTool, Dict[str, Any]]]] = None, + response_model: Optional[Type[BaseModel]] = None, + scrubPII: Optional[bool] = False, + **kwargs + ) -> Union[Iterator[Dict[str, Any]], Dict[str, Any]]: + """ + Generate chat completions based on provided messages or input_data for prompt templates. + + Args: + messages (Optional): Either pre-set messages or None if using input_data. + input_data (Optional[Dict[str, Any]]): Input variables for prompt templates. + llm_component (str): Name of the LLM component to use for the request. + tools (List[Union[AgentTool, Dict[str, Any]]]): List of tools for the request. + response_model (Type[BaseModel]): Optional Pydantic model for structured response parsing. + scrubPII (Type[bool]): Optional flag to obfuscate any sensitive information coming back from the LLM. + **kwargs: Additional parameters for the language model. + + Returns: + Union[Iterator[Dict[str, Any]], Dict[str, Any]]: The chat completion response(s). + """ + + # If input_data is provided, check for a prompt_template + if input_data: + if not self.prompt_template: + raise ValueError("Inputs are provided but no 'prompt_template' is set. 
Please set a 'prompt_template' to use the input_data.") + + logger.info("Using prompt template to generate messages.") + messages = self.prompt_template.format_prompt(**input_data) + + # Ensure we have messages at this point + if not messages: + raise ValueError("Either 'messages' or 'input_data' must be provided.") + + # Process and normalize the messages + params = {'messages': RequestHandler.normalize_chat_messages(messages)} + + # Merge Prompty parameters if available, then override with any explicit kwargs + if self.prompty: + params = {**self.prompty.model.parameters.model_dump(), **params, **kwargs} + else: + params.update(kwargs) + + # If a model is provided, override the default model + params['llm_component'] = llm_component or self._llm_component + params['scrubPII'] = scrubPII + + # Prepare and send the request + params = RequestHandler.process_params(params, llm_provider=self.provider, tools=tools, response_model=response_model) + + try: + logger.info("Invoking the Dapr Conversation API.") + response = self.client.chat_completion(**params) + logger.info("Chat completion retrieved successfully.") + + return ResponseHandler.process_response(response, llm_provider=self.provider, response_model=response_model, stream=params.get('stream', False)) + except Exception as e: + logger.error(f"An error occurred during the Dapr Conversation API call: {e}") + raise \ No newline at end of file diff --git a/dapr_agents/llm/dapr/client.py b/dapr_agents/llm/dapr/client.py new file mode 100644 index 00000000..24fb8707 --- /dev/null +++ b/dapr_agents/llm/dapr/client.py @@ -0,0 +1,87 @@ +from dapr_agents.types.llm import DaprInferenceClientConfig +from dapr_agents.llm.base import LLMClientBase +from typing import Optional, Dict, Any, List +from pydantic import Field, model_validator +import os +import logging +import requests +import json + +logger = logging.getLogger(__name__) + +class DaprClient: + def __init__(self): + self._dapr_endpoint = os.getenv('DAPR_BASE_URL', 'http://localhost') + ':' + os.getenv( + 'DAPR_HTTP_PORT', '3500') + + def chat_completion(self, llm: str, request: List[Dict]) -> Any: + messages = request['messages'] + scrubPII = request['scrubPII'] + + conversation_request = { + "inputs": messages, + "scrubPII": scrubPII + } + + # Invoke Dapr + result = requests.post( + url='%s/v1.0-alpha1/conversation/%s/converse' % (self._dapr_endpoint, llm), + data=json.dumps(conversation_request) + ) + + return result.json() + +class DaprInferenceClientBase(LLMClientBase): + """ + Base class for managing Dapr Inference API clients. + Handles client initialization, configuration, and shared logic. + """ + @model_validator(mode="before") + def validate_and_initialize(cls, values: Dict[str, Any]) -> Dict[str, Any]: + return values + + def model_post_init(self, __context: Any) -> None: + """ + Initializes private attributes after validation. + """ + self._provider = "dapr" + + # Set up the private config and client attributes + self._config = self.get_config() + self._client = self.get_client() + return super().model_post_init(__context) + + def get_config(self) -> DaprInferenceClientConfig: + """ + Returns the appropriate configuration for the Dapr Conversation API. + """ + return DaprInferenceClientConfig() + + def get_client(self) -> DaprClient: + """ + Initializes and returns the Dapr Inference client. 
+ """ + config: DaprInferenceClientConfig = self.config + return DaprClient() + + @classmethod + def from_config(cls, client_options: DaprInferenceClientConfig, timeout: float = 1500): + """ + Initializes the DaprInferenceClientBase using DaprInferenceClientConfig. + + Args: + client_options: The configuration options for the client. + timeout: Timeout for requests (default is 1500 seconds). + + Returns: + DaprInferenceClientBase: The initialized client instance. + """ + return cls() + + @property + def config(self) -> Dict[str, Any]: + return self._config + + @property + def client(self) -> DaprClient: + return self._client diff --git a/dapr_agents/types/llm.py b/dapr_agents/types/llm.py index 770c6041..2a2fc5e1 100644 --- a/dapr_agents/types/llm.py +++ b/dapr_agents/types/llm.py @@ -31,6 +31,14 @@ def none_to_default(cls, v): raise PydanticUseDefault() return v +class DaprInferenceClientConfig: + @field_validator("*", mode="before") + @classmethod + def none_to_default(cls, v): + if v is None: + raise PydanticUseDefault() + return v + class HFInferenceClientConfig(BaseModel): model: Optional[str] = Field(None, description="Model ID on Hugging Face Hub or URL to a deployed Inference Endpoint. Defaults to a recommended model if not provided.") api_key: Optional[Union[str, bool]] = Field(None, description="Hugging Face API key for authentication. Defaults to the locally saved token. Pass False to skip token.") From dd9e961b358bbeb335536a9b399b15cc11f3fbbc Mon Sep 17 00:00:00 2001 From: yaron2 Date: Fri, 21 Feb 2025 11:45:29 -0800 Subject: [PATCH 2/4] add response parsing Signed-off-by: yaron2 --- dapr_agents/llm/dapr/chat.py | 34 ++++++++++++++++++++++++++++------ dapr_agents/llm/dapr/client.py | 12 ++---------- 2 files changed, 30 insertions(+), 16 deletions(-) diff --git a/dapr_agents/llm/dapr/chat.py b/dapr_agents/llm/dapr/chat.py index 8bdbdcca..308ac63b 100644 --- a/dapr_agents/llm/dapr/chat.py +++ b/dapr_agents/llm/dapr/chat.py @@ -9,6 +9,7 @@ from pathlib import Path import logging import os +import time logger = logging.getLogger(__name__) @@ -57,6 +58,29 @@ def from_prompty(cls, prompty_source: Union[str, Path], timeout: Union[int, floa 'prompt_template': prompt_template, }) + def translate_response(self, response: dict, model: str) -> dict: + """Converts a Dapr response dict into a structure compatible with Choice and ChatCompletion.""" + choices = [ + { + "finish_reason": "stop", + "index": i, + "message": { + "content": output["result"], + "role": "assistant" + }, + "logprobs": None + } + for i, output in enumerate(response.get("outputs", [])) + ] + + return { + "choices": choices, + "created": int(time.time()), + "model": model, + "object": "chat.completion", + "usage": {"total_tokens": len(response.get("outputs", []))} + } + def generate( self, messages: Union[str, Dict[str, Any], BaseMessage, Iterable[Union[Dict[str, Any], BaseMessage]]] = None, @@ -96,16 +120,13 @@ def generate( raise ValueError("Either 'messages' or 'input_data' must be provided.") # Process and normalize the messages - params = {'messages': RequestHandler.normalize_chat_messages(messages)} - + params = {'inputs': RequestHandler.normalize_chat_messages(messages)} # Merge Prompty parameters if available, then override with any explicit kwargs if self.prompty: params = {**self.prompty.model.parameters.model_dump(), **params, **kwargs} else: params.update(kwargs) - # If a model is provided, override the default model - params['llm_component'] = llm_component or self._llm_component params['scrubPII'] = scrubPII 
 
         # Prepare and send the request
         params = RequestHandler.process_params(params, llm_provider=self.provider, tools=tools, response_model=response_model)
 
         try:
             logger.info("Invoking the Dapr Conversation API.")
-            response = self.client.chat_completion(**params)
+            response = self.client.chat_completion(llm_component or self._llm_component, params)
+            transposed_response = self.translate_response(response, self._llm_component)
             logger.info("Chat completion retrieved successfully.")
 
-            return ResponseHandler.process_response(response, llm_provider=self.provider, response_model=response_model, stream=params.get('stream', False))
+            return ResponseHandler.process_response(transposed_response, llm_provider=self.provider, response_model=response_model, stream=params.get('stream', False))
         except Exception as e:
             logger.error(f"An error occurred during the Dapr Conversation API call: {e}")
             raise
\ No newline at end of file

diff --git a/dapr_agents/llm/dapr/client.py b/dapr_agents/llm/dapr/client.py
index 24fb8707..a62eda22 100644
--- a/dapr_agents/llm/dapr/client.py
+++ b/dapr_agents/llm/dapr/client.py
@@ -15,20 +15,12 @@ def __init__(self):
             'DAPR_HTTP_PORT', '3500')
 
     def chat_completion(self, llm: str, request: List[Dict]) -> Any:
-        messages = request['messages']
-        scrubPII = request['scrubPII']
-
-        conversation_request = {
-            "inputs": messages,
-            "scrubPII": scrubPII
-        }
-
         # Invoke Dapr
         result = requests.post(
             url='%s/v1.0-alpha1/conversation/%s/converse' % (self._dapr_endpoint, llm),
-            data=json.dumps(conversation_request)
+            data=json.dumps(request)
         )
-
+
         return result.json()
 
 class DaprInferenceClientBase(LLMClientBase):

From 93c2ede30876267d2e0ecd2c53aa14ed0bf70d1b Mon Sep 17 00:00:00 2001
From: yaron2
Date: Mon, 24 Feb 2025 20:16:06 -0800
Subject: [PATCH 3/4] replace http request with dapr client

Signed-off-by: yaron2
---
 dapr_agents/llm/dapr/chat.py   | 21 +++++++++++----
 dapr_agents/llm/dapr/client.py | 48 ++++++++++++++++++++--------------
 requirements.txt               |  2 +-
 3 files changed, 45 insertions(+), 26 deletions(-)

diff --git a/dapr_agents/llm/dapr/chat.py b/dapr_agents/llm/dapr/chat.py
index 308ac63b..936a1b14 100644
--- a/dapr_agents/llm/dapr/chat.py
+++ b/dapr_agents/llm/dapr/chat.py
@@ -4,6 +4,7 @@
 from dapr_agents.types.message import BaseMessage
 from dapr_agents.llm.chat import ChatClientBase
 from dapr_agents.tool import AgentTool
+from dapr.clients.grpc._request import ConversationInput
 from typing import Union, Optional, Iterable, Dict, Any, List, Iterator, Type
 from pydantic import BaseModel
 from pathlib import Path
@@ -78,9 +79,19 @@ def translate_response(self, response: dict, model: str) -> dict:
             "created": int(time.time()),
             "model": model,
             "object": "chat.completion",
-            "usage": {"total_tokens": len(response.get("outputs", []))}
+            "usage": {"total_tokens": "-1"}
         }
 
+    def convert_to_conversation_inputs(self, inputs: List[Dict[str, Any]]) -> List[ConversationInput]:
+        return [
+            ConversationInput(
+                content=item["content"],
+                role=item.get("role"),
+                scrub_pii=item.get("scrubPII") == "true"
+            )
+            for item in inputs
+        ]
+
     def generate(
         self,
         messages: Union[str, Dict[str, Any], BaseMessage, Iterable[Union[Dict[str, Any], BaseMessage]]] = None,
@@ -89,6 +100,7 @@ def generate(
         tools: Optional[List[Union[AgentTool, Dict[str, Any]]]] = None,
         response_model: Optional[Type[BaseModel]] = None,
         scrubPII: Optional[bool] = False,
+        temperature: Optional[float] = None,
         **kwargs
     ) -> Union[Iterator[Dict[str, Any]], Dict[str, Any]]:
         """
@@ -127,14 +139,13 @@ def generate(
         else:
             params.update(kwargs)
 
-        params['scrubPII'] = scrubPII
-
         # Prepare and send the request
         params = RequestHandler.process_params(params, llm_provider=self.provider, tools=tools, response_model=response_model)
-
+        inputs = self.convert_to_conversation_inputs(params['inputs'])
+
         try:
             logger.info("Invoking the Dapr Conversation API.")
-            response = self.client.chat_completion(llm_component or self._llm_component, params)
+            response = self.client.chat_completion(llm=llm_component or self._llm_component, conversation_inputs=inputs, scrub_pii=scrubPII, temperature=temperature)
             transposed_response = self.translate_response(response, self._llm_component)
             logger.info("Chat completion retrieved successfully.")

diff --git a/dapr_agents/llm/dapr/client.py b/dapr_agents/llm/dapr/client.py
index a62eda22..c8bc7994 100644
--- a/dapr_agents/llm/dapr/client.py
+++ b/dapr_agents/llm/dapr/client.py
@@ -1,27 +1,35 @@
 from dapr_agents.types.llm import DaprInferenceClientConfig
 from dapr_agents.llm.base import LLMClientBase
-from typing import Optional, Dict, Any, List
-from pydantic import Field, model_validator
-import os
+from dapr.clients import DaprClient
+from dapr.clients.grpc._request import ConversationInput
+from dapr.clients.grpc._response import ConversationResponse
+from typing import Dict, Any, List
+from pydantic import model_validator
+
 import logging
-import requests
-import json
 
 logger = logging.getLogger(__name__)
 
-class DaprClient:
-    def __init__(self):
-        self._dapr_endpoint = os.getenv('DAPR_BASE_URL', 'http://localhost') + ':' + os.getenv(
-            'DAPR_HTTP_PORT', '3500')
+class DaprInferenceClient:
+    def translate_to_json(self, response: ConversationResponse) -> dict:
+        response_dict = {
+            "outputs": [
+                {
+                    "result": output.result,
+                }
+                for output in response.outputs
+            ]
+        }
+
+        return response_dict
+
+    def chat_completion(self, llm: str, conversation_inputs: List[ConversationInput], scrub_pii: bool | None = None, temperature: float | None = None) -> Any:
+        with DaprClient() as client:
+            response = client.converse_alpha1(name=llm, inputs=conversation_inputs, scrub_pii=scrub_pii, temperature=temperature)
+            output = self.translate_to_json(response)
+
+            return output
 
-    def chat_completion(self, llm: str, request: List[Dict]) -> Any:
-        # Invoke Dapr
-        result = requests.post(
-            url='%s/v1.0-alpha1/conversation/%s/converse' % (self._dapr_endpoint, llm),
-            data=json.dumps(request)
-        )
-
-        return result.json()
 
 class DaprInferenceClientBase(LLMClientBase):

diff --git a/requirements.txt b/requirements.txt
index af31705d..ee4f7fd9 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -5,7 +5,7 @@ openapi-schema-pydantic==1.2.4
 regex>=2023.12.25
 Jinja2==3.1.5
 azure-identity==1.19.0
-dapr==1.14.0
+dapr==1.15.0rc3
 dapr-ext-fastapi==1.14.0
 dapr-ext-workflow==0.5.0
 colorama==0.4.6

From 2cc4d088a669aacae824e7dc57db2210926fcc97 Mon Sep 17 00:00:00 2001
From: yaron2
Date: Tue, 25 Feb 2025 14:45:37 -0800
Subject: [PATCH 4/4] address review comments

Signed-off-by: yaron2
---
 dapr_agents/llm/dapr/chat.py   | 3 ---
 dapr_agents/llm/dapr/client.py | 1 -
 2 files changed, 4 deletions(-)

diff --git a/dapr_agents/llm/dapr/chat.py b/dapr_agents/llm/dapr/chat.py
index 936a1b14..517e7275 100644
--- a/dapr_agents/llm/dapr/chat.py
+++ b/dapr_agents/llm/dapr/chat.py
@@ -49,9 +49,6 @@ def from_prompty(cls, prompty_source: Union[str, Path], timeout: Union[int, floa
         # Generate the prompt template from the Prompty instance
         prompt_template = Prompty.to_prompt_template(prompty_instance)
 
-        # Extract the model configuration from Prompty
-        model_config = prompty_instance.model
-
         # Initialize the DaprChatClient based on the Prompty model configuration
         return cls.model_validate({
             'timeout': timeout,

diff --git a/dapr_agents/llm/dapr/client.py b/dapr_agents/llm/dapr/client.py
index c8bc7994..f0609f02 100644
--- a/dapr_agents/llm/dapr/client.py
+++ b/dapr_agents/llm/dapr/client.py
@@ -61,7 +61,6 @@ def get_client(self) -> DaprInferenceClient:
         """
         Initializes and returns the Dapr Inference client.
""" config: DaprInferenceClientConfig = self.config - return DaprClient() + return DaprInferenceClient() @classmethod def from_config(cls, client_options: DaprInferenceClientConfig, timeout: float = 1500): @@ -75,5 +83,5 @@ def config(self) -> Dict[str, Any]: return self._config @property - def client(self) -> DaprClient: + def client(self) -> DaprInferenceClient: return self._client diff --git a/requirements.txt b/requirements.txt index af31705d..ee4f7fd9 100644 --- a/requirements.txt +++ b/requirements.txt @@ -5,7 +5,7 @@ openapi-schema-pydantic==1.2.4 regex>=2023.12.25 Jinja2==3.1.5 azure-identity==1.19.0 -dapr==1.14.0 +dapr==1.15.0rc3 dapr-ext-fastapi==1.14.0 dapr-ext-workflow==0.5.0 colorama==0.4.6 From 2cc4d088a669aacae824e7dc57db2210926fcc97 Mon Sep 17 00:00:00 2001 From: yaron2 Date: Tue, 25 Feb 2025 14:45:37 -0800 Subject: [PATCH 4/4] address review comments Signed-off-by: yaron2 --- dapr_agents/llm/dapr/chat.py | 3 --- dapr_agents/llm/dapr/client.py | 1 - 2 files changed, 4 deletions(-) diff --git a/dapr_agents/llm/dapr/chat.py b/dapr_agents/llm/dapr/chat.py index 936a1b14..517e7275 100644 --- a/dapr_agents/llm/dapr/chat.py +++ b/dapr_agents/llm/dapr/chat.py @@ -49,9 +49,6 @@ def from_prompty(cls, prompty_source: Union[str, Path], timeout: Union[int, floa # Generate the prompt template from the Prompty instance prompt_template = Prompty.to_prompt_template(prompty_instance) - # Extract the model configuration from Prompty - model_config = prompty_instance.model - # Initialize the DaprChatClient based on the Prompty model configuration return cls.model_validate({ 'timeout': timeout, diff --git a/dapr_agents/llm/dapr/client.py b/dapr_agents/llm/dapr/client.py index c8bc7994..f0609f02 100644 --- a/dapr_agents/llm/dapr/client.py +++ b/dapr_agents/llm/dapr/client.py @@ -61,7 +61,6 @@ def get_client(self) -> DaprInferenceClient: """ Initializes and returns the Dapr Inference client. """ - config: DaprInferenceClientConfig = self.config return DaprInferenceClient() @classmethod