@@ -1,6 +1,8 @@
from unittest import mock
import pytest
+import re
import responses
+import httpx

from huggingface_hub import InferenceClient

@@ -76,6 +78,56 @@ def mock_hf_text_generation_api():
    yield rsps


+@pytest.fixture
+def mock_hf_text_generation_api_httpx(httpx_mock):
+    # type: (Any) -> Any
+    """Mock HuggingFace text generation API for httpx"""
+    model_name = "test-model"
+
+    # Mock the model info endpoint, allowing multiple calls; the URL is
+    # matched with a regex so that query parameters don't break the match
+    model_url_pattern = re.compile(
+        re.escape(MODEL_ENDPOINT.format(model_name=model_name)) + r"(\?.*)?$"
+    )
+
+    # The client calls the model info endpoint twice, so register exactly two responses
+    for _ in range(2):
+        httpx_mock.add_response(
+            method="GET",
+            url=model_url_pattern,
+            json={
+                "id": model_name,
+                "pipeline_tag": "text-generation",
+                "inferenceProviderMapping": {
+                    "hf-inference": {
+                        "status": "live",
+                        "providerId": model_name,
+                        "task": "text-generation",
+                    }
+                },
+            },
+            status_code=200,
+        )
+
+    # Mock text generation endpoint
+    httpx_mock.add_response(
+        method="POST",
+        url=INFERENCE_ENDPOINT.format(model_name=model_name),
+        json={
+            "generated_text": "[mocked] Hello! How can I help you?",
+            "details": {
+                "finish_reason": "length",
+                "generated_tokens": 10,
+                "prefill": [],
+                "tokens": [],
+            },
+        },
+        status_code=200,
+    )
+
+    return httpx_mock
+
+
@pytest.fixture
def mock_hf_api_with_errors():
    # type: () -> Any
@@ -431,6 +483,63 @@ def test_text_generation(
    assert "gen_ai.response.model" not in span["data"]


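+# The client may issue requests beyond the ones mocked in the fixture,
+# so don't fail the test when a request has no registered response: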
+@pytest.mark.httpx_mock(assert_all_requests_were_expected=False)
+def test_text_generation_httpx(
+    sentry_init,
+    capture_events,
+    mock_hf_text_generation_api_httpx,
+):
+    # type: (Any, Any, Any) -> None
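+    """Same as test_text_generation, but with the HTTP layer mocked via httpx."""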
+    sentry_init(
+        traces_sample_rate=1.0,
+        send_default_pii=True,
+        integrations=[HuggingfaceHubIntegration(include_prompts=True)],
+    )
+    events = capture_events()
+
+    client = InferenceClient(model="test-model")
+
+    with sentry_sdk.start_transaction(name="test"):
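+        # details=True requests the detailed response (finish_reason,
+        # token counts) that the fixture's mocked payload provides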
+        client.text_generation(
+            "Hello",
+            stream=False,
+            details=True,
+        )
+
+    (transaction,) = events
+
+    # Find the huggingface_hub span (there might be httpx spans too)
+    hf_spans = [
+        span for span in transaction["spans"] if span["op"] == "gen_ai.generate_text"
+    ]
+    assert len(hf_spans) == 1, (
+        f"Expected 1 huggingface span, got {len(hf_spans)}: {[s['op'] for s in transaction['spans']]}"
+    )
+    span = hf_spans[0]
+
+    assert span["op"] == "gen_ai.generate_text"
+    assert span["description"] == "generate_text test-model"
+    assert span["origin"] == "auto.ai.huggingface_hub"
+
+    expected_data = {
+        "gen_ai.operation.name": "generate_text",
+        "gen_ai.request.model": "test-model",
+        "gen_ai.response.finish_reasons": "length",
+        "gen_ai.response.streaming": False,
+        "gen_ai.usage.total_tokens": 10,
+        "thread.id": mock.ANY,
+        "thread.name": mock.ANY,
+    }
+
+    expected_data["gen_ai.request.messages"] = "Hello"
+    expected_data["gen_ai.response.text"] = "[mocked] Hello! How can I help you?"
+
+    assert span["data"] == expected_data
+
+    # text generation does not set the response model
+    assert "gen_ai.response.model" not in span["data"]
+
+
@pytest.mark.parametrize("send_default_pii", [True, False])
@pytest.mark.parametrize("include_prompts", [True, False])
def test_text_generation_streaming(