scaleapi
diff --git a/examples/tutorials/00_sync/000_hello_acp/tests/test_agent.py b/examples/tutorials/00_sync/000_hello_acp/tests/test_agent.py
Lines changed: 41 additions & 106 deletions
diff --git a/examples/tutorials/00_sync/010_multiturn/tests/test_agent.py b/examples/tutorials/00_sync/010_multiturn/tests/test_agent.py
Lines changed: 54 additions & 125 deletions
@@ -1,129 +1,64 @@
 """
-Sample tests for AgentEx ACP agent.
+Tests for s000-hello-acp (sync agent)
 
-This test suite demonstrates how to test the main AgentEx API functions:
+This test suite demonstrates testing a sync agent using the AgentEx testing framework.
+
+Test coverage:
 - Non-streaming message sending
 - Streaming message sending
-- Task creation via RPC
 
-To run these tests:
-1. Make sure the agent is running (via docker-compose or `agentex agents run`)
-2. Set the AGENTEX_API_BASE_URL environment variable if not using default
-3. Run: pytest test_agent.py -v
+Prerequisites:
+    - AgentEx services running (make dev)
+    - Agent running: agentex agents run --manifest manifest.yaml
 
-Configuration:
-- AGENTEX_API_BASE_URL: Base URL for the AgentEx server (default: http://localhost:5003)
-- AGENT_NAME: Name of the agent to test (default: hello-acp)
+Run tests:
+    pytest tests/test_agent.py -v
 """
 
-import os
+from agentex.lib.testing import (
+    test_sync_agent,
+    collect_streaming_deltas,
+    assert_valid_agent_response,
+)
 
-import pytest
+AGENT_NAME = "s000-hello-acp"
 
-from agentex import Agentex
-from agentex.types import TextDelta, TextContent, TextContentParam
-from agentex.types.agent_rpc_params import ParamsSendMessageRequest
-from agentex.types.task_message_update import StreamTaskMessageFull, StreamTaskMessageDelta
 
-# Configuration from environment variables
-AGENTEX_API_BASE_URL = os.environ.get("AGENTEX_API_BASE_URL", "http://localhost:5003")
-AGENT_NAME = os.environ.get("AGENT_NAME", "s000-hello-acp")
+def test_send_simple_message():
+    """Test sending a simple message and receiving a response."""
+    with test_sync_agent(agent_name=AGENT_NAME) as test:
+        message_content = "Hello, Agent! How are you?"
+        response = test.send_message(message_content)
 
+        # Validate response
+        assert_valid_agent_response(response)
 
-@pytest.fixture
-def client():
-    """Create an AgentEx client instance for testing."""
-    client = Agentex(base_url=AGENTEX_API_BASE_URL)
-    yield client
-    # Clean up: close the client connection
-    client.close()
+        # Check expected response format
+        expected = f"Hello! I've received your message. Here's a generic response, but in future tutorials we'll see how you can get me to intelligently respond to your message. This is what I heard you say: {message_content}"
+        assert response.content == expected, f"Expected: {expected}\nGot: {response.content}"
 
 
-@pytest.fixture
-def agent_name():
-    """Return the agent name for testing."""
-    return AGENT_NAME
+def test_stream_simple_message():
+    """Test streaming a simple message and aggregating deltas."""
+    with test_sync_agent(agent_name=AGENT_NAME) as test:
+        message_content = "Hello, Agent! Can you stream your response?"
 
+        # Get streaming response
+        response_gen = test.send_message_streaming(message_content)
 
-class TestNonStreamingMessages:
-    """Test non-streaming message sending."""
+        # Collect streaming deltas
+        aggregated_content, chunks = collect_streaming_deltas(response_gen)
 
-    def test_send_simple_message(self, client: Agentex, agent_name: str):
-        """Test sending a simple message and receiving a response."""
+        # Validate we got content
+        assert len(chunks) > 0, "Should receive at least one chunk"
+        assert len(aggregated_content) > 0, "Should receive content"
 
-        message_content = "Hello, Agent! How are you?"
-        response = client.agents.send_message(
-            agent_name=agent_name,
-            params=ParamsSendMessageRequest(
-                content=TextContentParam(
-                    author="user",
-                    content=message_content,
-                    type="text",
-                )
-            ),
-        )
-        result = response.result
-        assert result is not None
-        assert len(result) == 1
-        message = result[0]
-        assert isinstance(message.content, TextContent)
-        assert (
-            message.content.content
-            == f"Hello! I've received your message. Here's a generic response, but in future tutorials we'll see how you can get me to intelligently respond to your message. This is what I heard you say: {message_content}"
-        )
-
-
-class TestStreamingMessages:
-    """Test streaming message sending."""
-
-    def test_stream_simple_message(self, client: Agentex, agent_name: str):
-        """Test streaming a simple message and aggregating deltas."""
-
-        message_content = "Hello, Agent! Can you stream your response?"
-        aggregated_content = ""
-        full_content = ""
-        received_chunks = False
-
-        for chunk in client.agents.send_message_stream(
-            agent_name=agent_name,
-            params=ParamsSendMessageRequest(
-                content=TextContentParam(
-                    author="user",
-                    content=message_content,
-                    type="text",
-                )
-            ),
-        ):
-            received_chunks = True
-            task_message_update = chunk.result
-            # Collect text deltas as they arrive or check full messages
-            if isinstance(task_message_update, StreamTaskMessageDelta) and task_message_update.delta is not None:
-                delta = task_message_update.delta
-                if isinstance(delta, TextDelta) and delta.text_delta is not None:
-                    aggregated_content += delta.text_delta
-
-            elif isinstance(task_message_update, StreamTaskMessageFull):
-                content = task_message_update.content
-                if isinstance(content, TextContent):
-                    full_content = content.content
-
-        if not full_content and not aggregated_content:
-            raise AssertionError("No content was received in the streaming response.")
-        if not received_chunks:
-            raise AssertionError("No streaming chunks were received, when at least 1 was expected.")
-
-        if full_content:
-            assert (
-                full_content
-                == f"Hello! I've received your message. Here's a generic response, but in future tutorials we'll see how you can get me to intelligently respond to your message. This is what I heard you say: {message_content}"
-            )
-
-        if aggregated_content:
-            assert (
-                aggregated_content
-                == f"Hello! I've received your message. Here's a generic response, but in future tutorials we'll see how you can get me to intelligently respond to your message. This is what I heard you say: {message_content}"
-            )
+        # Check expected response format
+        expected = f"Hello! I've received your message. Here's a generic response, but in future tutorials we'll see how you can get me to intelligently respond to your message. This is what I heard you say: {message_content}"
+        assert aggregated_content == expected, f"Expected: {expected}\nGot: {aggregated_content}"
 
 
 if __name__ == "__main__":
+    import pytest
+
     pytest.main([__file__, "-v"])
@@ -1,154 +1,83 @@
 """
-Sample tests for AgentEx ACP agent.
+Tests for s010-multiturn (sync agent)
 
-This test suite demonstrates how to test the main AgentEx API functions:
-- Non-streaming message sending
-- Streaming message sending
-- Task creation via RPC
+This test suite demonstrates testing a multi-turn sync agent using the AgentEx testing framework.
 
-To run these tests:
-1. Make sure the agent is running (via docker-compose or `agentex agents run`)
-2. Set the AGENTEX_API_BASE_URL environment variable if not using default
-3. Run: pytest test_agent.py -v
+Test coverage:
+- Multi-turn non-streaming conversation
+- Multi-turn streaming conversation
+- Conversation history accumulation across turns
 
-Configuration:
-- AGENTEX_API_BASE_URL: Base URL for the AgentEx server (default: http://localhost:5003)
-- AGENT_NAME: Name of the agent to test (default: s010-multiturn)
-"""
-
-import os
-
-import pytest
-from test_utils.sync import validate_text_in_string, collect_streaming_response
-
-from agentex import Agentex
-from agentex.types import TextContent, TextContentParam
-from agentex.types.agent_rpc_params import ParamsCreateTaskRequest, ParamsSendMessageRequest
-from agentex.lib.sdk.fastacp.base.base_acp_server import uuid
-
-# Configuration from environment variables
-AGENTEX_API_BASE_URL = os.environ.get("AGENTEX_API_BASE_URL", "http://localhost:5003")
-AGENT_NAME = os.environ.get("AGENT_NAME", "s010-multiturn")
+Prerequisites:
+    - AgentEx services running (make dev)
+    - Agent running: agentex agents run --manifest manifest.yaml
 
+Run tests:
+    pytest tests/test_agent.py -v
+"""
 
-@pytest.fixture
-def client():
-    """Create an AgentEx client instance for testing."""
-    return Agentex(base_url=AGENTEX_API_BASE_URL)
-
+from agentex.lib.testing import (
+    test_sync_agent,
+    collect_streaming_deltas,
+    assert_valid_agent_response,
+    assert_agent_response_contains,
+)
 
-@pytest.fixture
-def agent_name():
-    """Return the agent name for testing."""
-    return AGENT_NAME
+AGENT_NAME = "s010-multiturn"
 
 
-@pytest.fixture
-def agent_id(client, agent_name):
-    """Retrieve the agent ID based on the agent name."""
-    agents = client.agents.list()
-    for agent in agents:
-        if agent.name == agent_name:
-            return agent.id
-    raise ValueError(f"Agent with name {agent_name} not found.")
+def test_multiturn_conversation():
+    """Test multi-turn conversation with non-streaming messages."""
+    with test_sync_agent(agent_name=AGENT_NAME) as test:
+        messages = [
+            "Hello, can you tell me a little bit about tennis? I want you to make sure you use the word 'tennis' in each response.",
+            "Pick one of the things you just mentioned, and dive deeper into it.",
+            "Can you now output a summary of this conversation",
+        ]
 
+        for msg in messages:
+            response = test.send_message(msg)
 
-class TestNonStreamingMessages:
-    """Test non-streaming message sending."""
+            # Validate response
+            assert_valid_agent_response(response)
 
-    def test_send_message(self, client: Agentex, agent_name: str, agent_id: str):
-        task_response = client.agents.create_task(agent_id, params=ParamsCreateTaskRequest(name=uuid.uuid1().hex))
-        task = task_response.result
+            # Validate "tennis" appears in response (per agent's behavior)
+            assert_agent_response_contains(response, "tennis")
 
-        assert task is not None
+        # Verify conversation history
+        history = test.get_conversation_history()
+        assert len(history) >= 6, f"Expected >= 6 messages (3 user + 3 agent), got {len(history)}"
 
-        messages = [
-            "Hello, can you tell me a litle bit about tennis? I want to you make sure you use the word 'tennis' in each response.",
-            "Pick one of the things you just mentioned, and dive deeper into it.",
-            "Can you now output a summary of this conversation",
-        ]
 
-        for i, msg in enumerate(messages):
-            response = client.agents.send_message(
-                agent_name=agent_name,
-                params=ParamsSendMessageRequest(
-                    content=TextContentParam(
-                        author="user",
-                        content=msg,
-                        type="text",
-                    ),
-                    task_id=task.id,
-                ),
-            )
-            assert response is not None and response.result is not None
-            result = response.result
-
-            for message in result:
-                content = message.content
-                assert content is not None
-                assert isinstance(content, TextContent) and isinstance(content.content, str)
-                validate_text_in_string("tennis", content.content)
-
-            states = client.states.list(agent_id=agent_id, task_id=task.id)
-            assert len(states) == 1
-
-            state = states[0]
-            assert state.state is not None
-            assert state.state.get("system_prompt", None) == "You are a helpful assistant that can answer questions."
-
-            message_history = client.messages.list(
-                task_id=task.id,
-            )
-            assert len(message_history) == (i + 1) * 2  # user + agent messages
-
-
-class TestStreamingMessages:
-    """Test streaming message sending."""
-
-    def test_stream_message(self, client: Agentex, agent_name: str, agent_id: str):
-        """Test streaming messages in a multi-turn conversation."""
-
-        # create a task for this specific conversation
-        task_response = client.agents.create_task(agent_id, params=ParamsCreateTaskRequest(name=uuid.uuid1().hex))
-        task = task_response.result
-
-        assert task is not None
+def test_multiturn_streaming():
+    """Test multi-turn conversation with streaming messages."""
+    with test_sync_agent(agent_name=AGENT_NAME) as test:
         messages = [
             "Hello, can you tell me a little bit about tennis? I want you to make sure you use the word 'tennis' in each response.",
             "Pick one of the things you just mentioned, and dive deeper into it.",
             "Can you now output a summary of this conversation",
         ]
 
-        for i, msg in enumerate(messages):
-            stream = client.agents.send_message_stream(
-                agent_name=agent_name,
-                params=ParamsSendMessageRequest(
-                    content=TextContentParam(
-                        author="user",
-                        content=msg,
-                        type="text",
-                    ),
-                    task_id=task.id,
-                ),
-            )
+        for msg in messages:
+            # Get streaming response
+            response_gen = test.send_message_streaming(msg)
 
-            # Collect the streaming response
-            aggregated_content, chunks = collect_streaming_response(stream)
+            # Collect streaming deltas
+            aggregated_content, chunks = collect_streaming_deltas(response_gen)
 
-            assert len(chunks) == 1
-            # Get the actual content (prefer full_content if available, otherwise use aggregated)
+            # Validate we got content
+            assert len(chunks) > 0, "Should receive chunks"
+            assert len(aggregated_content) > 0, "Should receive content"
 
-            # Validate that "tennis" appears in the response because that is what our model does
-            validate_text_in_string("tennis", aggregated_content)
+            # Validate "tennis" appears in response
+            assert "tennis" in aggregated_content.lower(), f"Expected 'tennis' in: {aggregated_content[:100]}"
 
-            states = client.states.list(task_id=task.id)
-            assert len(states) == 1
-
-            message_history = client.messages.list(
-                task_id=task.id,
-            )
-            assert len(message_history) == (i + 1) * 2  # user + agent messages
+        # Verify conversation history
+        history = test.get_conversation_history()
+        assert len(history) >= 6, f"Expected >= 6 messages, got {len(history)}"
 
 
 if __name__ == "__main__":
+    import pytest
+
     pytest.main([__file__, "-v"])