
Commit c165b20

Count tokens (#315)
* Upgrade count tokens, add usage metadata. Change-Id: Ib07580b4f22db7e7c58109d6d0c8a27076f204da
* Fix usage_metadata for streaming, fix indentation in __str__. Change-Id: I08ceb067355c933c20d50beb8ee51f9e7ba83ee7
* format Change-Id: I11ed2499b974d7cacde88c740386a5f9a71186ea
* fix typing Change-Id: Ieeae7eefebc330a4b856b0016912f4fce509d780
1 parent 1efbcef commit c165b20

File tree: 6 files changed, +256 -25 lines changed


google/generativeai/generative_models.py

Lines changed: 34 additions & 12 deletions

@@ -322,35 +322,57 @@ async def generate_content_async(
     # fmt: off
     def count_tokens(
         self,
-        contents: content_types.ContentsType,
+        contents: content_types.ContentsType = None,
+        *,
+        generation_config: generation_types.GenerationConfigType | None = None,
+        safety_settings: safety_types.SafetySettingOptions | None = None,
+        tools: content_types.FunctionLibraryType | None = None,
+        tool_config: content_types.ToolConfigType | None = None,
         request_options: dict[str, Any] | None = None,
     ) -> glm.CountTokensResponse:
         if request_options is None:
             request_options = {}
 
         if self._client is None:
             self._client = client.get_default_generative_client()
-        contents = content_types.to_contents(contents)
-        return self._client.count_tokens(
-            glm.CountTokensRequest(model=self.model_name, contents=contents),
-            **request_options,
-        )
+
+        request = glm.CountTokensRequest(
+            model=self.model_name,
+            generate_content_request=self._prepare_request(
+                contents=contents,
+                generation_config=generation_config,
+                safety_settings=safety_settings,
+                tools=tools,
+                tool_config=tool_config,
+            ))
+        return self._client.count_tokens(request, **request_options)
 
     async def count_tokens_async(
         self,
-        contents: content_types.ContentsType,
+        contents: content_types.ContentsType = None,
+        *,
+        generation_config: generation_types.GenerationConfigType | None = None,
+        safety_settings: safety_types.SafetySettingOptions | None = None,
+        tools: content_types.FunctionLibraryType | None = None,
+        tool_config: content_types.ToolConfigType | None = None,
         request_options: dict[str, Any] | None = None,
     ) -> glm.CountTokensResponse:
         if request_options is None:
             request_options = {}
 
         if self._async_client is None:
             self._async_client = client.get_default_generative_async_client()
-        contents = content_types.to_contents(contents)
-        return await self._async_client.count_tokens(
-            glm.CountTokensRequest(model=self.model_name, contents=contents),
-            **request_options,
-        )
+
+        request = glm.CountTokensRequest(
+            model=self.model_name,
+            generate_content_request=self._prepare_request(
+                contents=contents,
+                generation_config=generation_config,
+                safety_settings=safety_settings,
+                tools=tools,
+                tool_config=tool_config,
+            ))
+        return await self._async_client.count_tokens(request, **request_options)
 
     # fmt: on

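With this change, count_tokens and count_tokens_async route through the same _prepare_request helper as generate_content, so the reported count covers the full request (tools, tool_config, generation and safety settings), not just the raw contents. A minimal usage sketch — the API key and model name below are placeholders, not part of this commit:

```python
import google.generativeai as genai

genai.configure(api_key="YOUR_API_KEY")  # placeholder key
model = genai.GenerativeModel("gemini-pro")  # any available model name

# The count now reflects the whole GenerateContentRequest,
# including any tools or config passed alongside the contents.
response = model.count_tokens(
    "Tell me a story about a magic backpack.",
    generation_config={"candidate_count": 1},
)
print(response.total_tokens)
```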
google/generativeai/types/generation_types.py

Lines changed: 14 additions & 2 deletions

@@ -16,10 +16,11 @@
 
 import collections
 import contextlib
-import sys
 from collections.abc import Iterable, AsyncIterable
 import dataclasses
 import itertools
+import json
+import sys
 import textwrap
 from typing import Union
 from typing_extensions import TypedDict

@@ -250,6 +251,7 @@ def _join_candidates(candidates: Iterable[glm.Candidate]):
         finish_reason=candidates[-1].finish_reason,
         safety_ratings=_join_safety_ratings_lists([c.safety_ratings for c in candidates]),
         citation_metadata=_join_citation_metadatas([c.citation_metadata for c in candidates]),
+        token_count=candidates[-1].token_count,
     )
 
 

@@ -276,9 +278,11 @@ def _join_prompt_feedbacks(
 
 
 def _join_chunks(chunks: Iterable[glm.GenerateContentResponse]):
+    chunks = tuple(chunks)
     return glm.GenerateContentResponse(
         candidates=_join_candidate_lists(c.candidates for c in chunks),
         prompt_feedback=_join_prompt_feedbacks(c.prompt_feedback for c in chunks),
+        usage_metadata=chunks[-1].usage_metadata,
     )
 
 

@@ -373,13 +377,21 @@ def text(self):
     def prompt_feedback(self):
         return self._result.prompt_feedback
 
+    @property
+    def usage_metadata(self):
+        return self._result.usage_metadata
+
     def __str__(self) -> str:
         if self._done:
             _iterator = "None"
         else:
             _iterator = f"<{self._iterator.__class__.__name__}>"
 
-        _result = f"glm.GenerateContentResponse({type(self._result).to_dict(self._result)})"
+        as_dict = type(self._result).to_dict(self._result)
+        json_str = json.dumps(as_dict, indent=2)
+
+        _result = f"glm.GenerateContentResponse({json_str})"
+        _result = _result.replace("\n", "\n                    ")
 
         if self._error:
             _error = f",\nerror=<{self._error.__class__.__name__}> {self._error}"

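Together these changes surface usage_metadata on GenerateContentResponse and make it survive streaming: _join_chunks first materializes the chunk iterable with tuple() (so it can be iterated twice and indexed) and then copies the usage_metadata reported on the final chunk. A hedged sketch of reading it, assuming the same placeholder setup as above:

```python
import google.generativeai as genai

genai.configure(api_key="YOUR_API_KEY")  # placeholder key
model = genai.GenerativeModel("gemini-pro")

# Non-streaming: the single response carries its usage_metadata.
response = model.generate_content("Hello")
print(response.usage_metadata)

# Streaming: once the stream is fully consumed, the joined result
# exposes the usage_metadata from the last chunk received.
stream = model.generate_content("Hello", stream=True)
for _ in stream:
    pass
print(stream.usage_metadata)
```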
setup.py

Lines changed: 1 addition & 1 deletion

@@ -42,7 +42,7 @@ def get_version():
 release_status = "Development Status :: 5 - Production/Stable"
 
 dependencies = [
-    "google-ai-generativelanguage==0.6.2",
+    "google-ai-generativelanguage@https://storage.googleapis.com/generativeai-downloads/preview/ai-generativelanguage-v1beta-py-2.tar.gz",
     "google-api-core",
     "google-api-python-client",
     "google-auth>=2.15.0",  # 2.15 adds API key auth support

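setup.py swaps the PyPI version pin for a PEP 508 direct-URL requirement pointing at a preview build of google-ai-generativelanguage. A quick, standard-library-only way to check which build actually got installed (a sketch, not part of this commit):

```python
from importlib import metadata

# Prints the version string of the installed preview package.
print(metadata.version("google-ai-generativelanguage"))
```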
tests/test_generation.py

Lines changed: 36 additions & 2 deletions

@@ -503,7 +503,24 @@ def test_repr_for_generate_content_response_from_response(self):
             GenerateContentResponse(
                 done=True,
                 iterator=None,
-                result=glm.GenerateContentResponse({'candidates': [{'content': {'parts': [{'text': 'Hello world!'}], 'role': ''}, 'finish_reason': 0, 'safety_ratings': [], 'token_count': 0, 'grounding_attributions': []}]}),
+                result=glm.GenerateContentResponse({
+                  "candidates": [
+                    {
+                      "content": {
+                        "parts": [
+                          {
+                            "text": "Hello world!"
+                          }
+                        ],
+                        "role": ""
+                      },
+                      "finish_reason": 0,
+                      "safety_ratings": [],
+                      "token_count": 0,
+                      "grounding_attributions": []
+                    }
+                  ]
+                }),
             )"""
         )
         self.assertEqual(expected, result)

@@ -522,7 +539,24 @@ def test_repr_for_generate_content_response_from_iterator(self):
             GenerateContentResponse(
                 done=False,
                 iterator=<list_iterator>,
-                result=glm.GenerateContentResponse({'candidates': [{'content': {'parts': [{'text': 'a'}], 'role': ''}, 'finish_reason': 0, 'safety_ratings': [], 'token_count': 0, 'grounding_attributions': []}]}),
+                result=glm.GenerateContentResponse({
+                  "candidates": [
+                    {
+                      "content": {
+                        "parts": [
+                          {
+                            "text": "a"
+                          }
+                        ],
+                        "role": ""
+                      },
+                      "finish_reason": 0,
+                      "safety_ratings": [],
+                      "token_count": 0,
+                      "grounding_attributions": []
+                    }
+                  ]
+                }),
             )"""
         )
         self.assertEqual(expected, result)

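Both expected strings pin down the new __str__ format: the proto result is converted to a dict, pretty-printed with json.dumps(..., indent=2), and every continuation line is re-indented so the JSON block nests under result=. A standalone illustration of that formatting step — the four-space indent here is illustrative, since the library applies its replacement inside a textwrap.dedent template:

```python
import json

as_dict = {"candidates": [{"content": {"parts": [{"text": "a"}], "role": ""}}]}
json_str = json.dumps(as_dict, indent=2)

_result = f"glm.GenerateContentResponse({json_str})"
# Re-indent continuation lines so the JSON nests under "result=".
_result = _result.replace("\n", "\n    ")
print(_result)
```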