|
| 1 | +import os |
| 2 | +import json |
| 3 | +from typing import Any |
| 4 | + |
| 5 | +try: |
| 6 | + from google import genai |
| 7 | + from google.genai import types |
| 8 | +except ImportError: |
| 9 | + msg = "google-genai is not installed. Please install it with `pip install any-llm-sdk[google]`" |
| 10 | + raise ImportError(msg) |
| 11 | + |
| 12 | +from openai.types.chat.chat_completion import ChatCompletion, Choice |
| 13 | +from openai.types.completion_usage import CompletionUsage |
| 14 | +from openai.types.chat.chat_completion_message import ChatCompletionMessage |
| 15 | +from openai.types.chat.chat_completion_message_tool_call import ChatCompletionMessageToolCall, Function |
| 16 | +from any_llm.provider import Provider, ApiConfig |
| 17 | + |
| 18 | +DEFAULT_TEMPERATURE = 0.7 |
| 19 | + |
| 20 | + |
| 21 | +def _convert_kwargs(kwargs: dict[str, Any]) -> dict[str, Any]: |
| 22 | + """Format the kwargs for Google GenAI.""" |
| 23 | + kwargs = kwargs.copy() |
| 24 | + |
| 25 | + # Convert tools if present |
| 26 | + if "tools" in kwargs: |
| 27 | + kwargs["tools"] = _convert_tool_spec(kwargs["tools"]) |
| 28 | + |
| 29 | + # Handle unsupported parameters |
| 30 | + unsupported_params = ["response_format", "parallel_tool_calls"] |
| 31 | + for param in unsupported_params: |
| 32 | + if param in kwargs: |
| 33 | + kwargs.pop(param) |
| 34 | + |
| 35 | + return kwargs |
| 36 | + |
| 37 | + |
def _convert_tool_spec(openai_tools: list[dict[str, Any]]) -> list[types.Tool]:
    """Convert OpenAI tool specification to Google GenAI format.

    Non-"function" tool entries are skipped. All function declarations are
    collected into a single ``types.Tool``, as GenAI expects.
    """
    declarations = []

    for tool in openai_tools:
        # Only "function"-type tools have a GenAI equivalent.
        if tool.get("type") != "function":
            continue

        fn = tool["function"]

        # Rebuild each parameter's JSON-schema entry, defaulting to a string
        # type and carrying the enum through only when present.
        properties: dict[str, Any] = {}
        for param_name, param_info in fn["parameters"]["properties"].items():
            prop = {
                "type": param_info.get("type", "string"),
                "description": param_info.get("description", ""),
            }
            if "enum" in param_info:
                prop["enum"] = param_info["enum"]
            properties[param_name] = prop

        declarations.append(
            types.FunctionDeclaration(
                name=fn["name"],
                description=fn.get("description", ""),
                parameters=types.Schema(
                    type="object",
                    properties=properties,
                    required=fn["parameters"].get("required", []),
                ),
            )
        )

    return [types.Tool(function_declarations=declarations)]
| 70 | + |
def _convert_messages(messages: list[dict[str, Any]]) -> list[types.Content]:
    """Convert OpenAI-style chat messages to Google GenAI ``Content`` objects.

    Args:
        messages: Dicts with a "role" key ("system", "user", "assistant", or
            "tool") and "content"; assistant messages may carry "tool_calls"
            instead of text content.

    Returns:
        The conversation as ``types.Content`` entries. System messages are
        mapped to the "user" role because this API surface has no separate
        system role; messages with any other role are dropped.
    """
    formatted_messages = []

    for message in messages:
        role = message["role"]
        if role in ("system", "user"):
            # System messages are treated as user messages in GenAI.
            parts = [types.Part.from_text(text=message["content"])]
            formatted_messages.append(types.Content(role="user", parts=parts))
        elif role == "assistant":
            if message.get("tool_calls"):
                # Emit one function-call part per tool call. (The previous
                # implementation only converted the first tool call and
                # silently dropped the rest.)
                parts = [
                    types.Part.from_function_call(
                        name=tool_call["function"]["name"],
                        args=json.loads(tool_call["function"]["arguments"]),
                    )
                    for tool_call in message["tool_calls"]
                ]
            else:
                # Plain assistant text.
                parts = [types.Part.from_text(text=message["content"])]

            formatted_messages.append(types.Content(role="model", parts=parts))
        elif role == "tool":
            # Tool results become function responses; non-JSON content is
            # wrapped in a {"result": ...} dict so the payload is always
            # structured.
            try:
                response = json.loads(message["content"])
            except json.JSONDecodeError:
                response = {"result": message["content"]}
            part = types.Part.from_function_response(
                name=message.get("name", "unknown"), response=response
            )
            formatted_messages.append(types.Content(role="function", parts=[part]))

    return formatted_messages
| 114 | + |
def _convert_response(response: Any) -> ChatCompletion:
    """Convert Google GenAI response to OpenAI ChatCompletion format.

    Only the first candidate's first part is inspected: a function call
    becomes an assistant message with tool_calls, anything else is treated
    as plain text. Token usage falls back to 0 when the response carries no
    usage metadata.
    """
    first_part = response.candidates[0].content.parts[0]
    function_call = getattr(first_part, "function_call", None)

    if function_call:
        # Copy the call arguments into a plain dict so they can be JSON-dumped.
        args_dict = {}
        if getattr(function_call, "args", None):
            for key, value in function_call.args.items():
                args_dict[key] = value

        message = ChatCompletionMessage(
            content=None,
            role="assistant",
            tool_calls=[
                ChatCompletionMessageToolCall(
                    # Synthetic id; GenAI does not supply one.
                    id=f"call_{hash(function_call.name)}",
                    type="function",
                    function=Function(name=function_call.name, arguments=json.dumps(args_dict)),
                )
            ],
        )
        finish_reason = "tool_calls"
    else:
        # Regular text response.
        message = ChatCompletionMessage(
            content=first_part.text,
            role="assistant",
            tool_calls=None,
        )
        finish_reason = "stop"

    choice = Choice(
        finish_reason=finish_reason,  # type: ignore
        index=0,
        message=message,
    )

    # getattr on a missing/None usage_metadata yields the 0 defaults.
    usage_metadata = getattr(response, "usage_metadata", None)
    usage = CompletionUsage(
        completion_tokens=getattr(usage_metadata, "candidates_token_count", 0),
        prompt_tokens=getattr(usage_metadata, "prompt_token_count", 0),
        total_tokens=getattr(usage_metadata, "total_token_count", 0),
    )

    return ChatCompletion(
        id="google_genai_response",
        model="google/genai",
        object="chat.completion",
        created=0,
        choices=[choice],
        usage=usage,
    )
| 186 | + |
class GoogleProvider(Provider):
    """Provider backed by Google GenAI (Gemini Developer API or Vertex AI)."""

    def __init__(self, config: ApiConfig) -> None:
        """Initialize Google GenAI provider.

        Configuration is read from the environment:
          - GOOGLE_USE_VERTEX_AI: "true" selects Vertex AI, anything else the
            Gemini Developer API.
          - Vertex AI: GOOGLE_PROJECT_ID (required), GOOGLE_REGION
            (default "us-central1").
          - Developer API: GEMINI_API_KEY or GOOGLE_API_KEY (one required).

        Raises:
            ValueError: If the required environment variables for the chosen
                backend are missing.
        """
        self.use_vertex_ai = os.getenv("GOOGLE_USE_VERTEX_AI", "false").lower() == "true"

        if self.use_vertex_ai:
            # Vertex AI configuration.
            self.project_id = os.getenv("GOOGLE_PROJECT_ID")
            self.location = os.getenv("GOOGLE_REGION", "us-central1")

            if not self.project_id:
                msg = "GOOGLE_PROJECT_ID environment variable is required for Vertex AI"
                raise ValueError(msg)

            self.client = genai.Client(vertexai=True, project=self.project_id, location=self.location)
        else:
            # Gemini Developer API configuration.
            api_key = os.getenv("GEMINI_API_KEY") or os.getenv("GOOGLE_API_KEY")

            if not api_key:
                msg = "GEMINI_API_KEY or GOOGLE_API_KEY environment variable is required for Gemini Developer API"
                raise ValueError(msg)

            self.client = genai.Client(api_key=api_key)

    def completion(
        self,
        model: str,
        messages: list[dict[str, Any]],
        **kwargs: Any,
    ) -> ChatCompletion:
        """Create a chat completion using Google GenAI.

        Args:
            model: Model identifier to pass to the GenAI client.
            messages: OpenAI-style chat messages.
            **kwargs: Optional parameters; "temperature" and "tools" are
                honored, unsupported ones are dropped by ``_convert_kwargs``.

        Returns:
            The response converted to an OpenAI ``ChatCompletion``.
        """
        kwargs = _convert_kwargs(kwargs)

        # Use the caller's temperature when given, otherwise the default.
        temperature = kwargs.get("temperature", DEFAULT_TEMPERATURE)

        # Convert the whole conversation to GenAI Content objects.
        formatted_messages = _convert_messages(messages)

        generation_config = types.GenerateContentConfig(
            temperature=temperature,
            tools=kwargs.get("tools"),
        )

        # Pass the converted Content list directly so every turn
        # (system/user/assistant/tool) reaches the model. The previous
        # implementation flattened only the user text into a single string
        # (with a hard-coded "Hello" fallback), discarding the rest of the
        # conversation it had just converted.
        response = self.client.models.generate_content(
            model=model,
            contents=formatted_messages,
            config=generation_config,
        )

        return _convert_response(response)
0 commit comments