Commit 0bffa8f

[8.0.5] batches API + Ollama
1 parent a72a099 commit 0bffa8f

8 files changed: +592 -99 lines changed

docs/changelog.rst

Lines changed: 14 additions & 0 deletions
@@ -7,6 +7,20 @@ minor versions.
 
 All relevant steps to be taken will be mentioned here.
 
+8.0.5
+-----
+
+- Adding support for Batches API in Openai and Anthropic models
+- Have not tested function calling on batches API
+- Have not tested structured generation on batches API
+- Removed dependency on ``openai`` package for audio transcribing by figuring out uploading of files
+- Added new ``Ollama`` class which works with ``OpenAIProtocol``
+
+8.0.4
+-----
+
+- Bug fixes
+
 8.0.3
 -----
 

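To make the new changelog entry concrete, here is a minimal sketch of submitting a batch through the Anthropic client, based only on the submit_batch signature added in this commit; the constructor call and model id are illustrative assumptions, not part of this diff:

import tuneapi.types as tt
from tuneapi.apis import Anthropic

# constructor arguments and model id are assumed for illustration
model = Anthropic("claude-3-5-sonnet-20241022")

threads = [
    tt.Thread(tt.human("Summarise the plot of Hamlet in one line")),
    "What is the capital of France?",  # bare strings get wrapped into a Thread
]

# submit_batch returns the provider batch id plus the generated custom_ids
# (or the raw JSON response when raw=True)
batch_id, custom_ids = model.submit_batch(threads, max_tokens=512)
print("submitted batch:", batch_id)

Retrieving results is sketched after the model_anthropic.py diff below.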
docs/conf.py

Lines changed: 1 addition & 1 deletion
@@ -13,7 +13,7 @@
 project = "tuneapi"
 copyright = "2024-2025, Frello Technologies"
 author = "Frello Technologies"
-release = "8.0.3"
+release = "8.0.5"
 
 # -- General configuration ---------------------------------------------------
 # https://www.sphinx-doc.org/en/master/usage/configuration.html#general-configuration

pyproject.toml

Lines changed: 1 addition & 1 deletion
@@ -1,6 +1,6 @@
 [tool.poetry]
 name = "tuneapi"
-version = "8.0.3"
+version = "8.0.5"
 description = "Tune AI APIs."
 authors = ["Frello Technology Private Limited <[email protected]>"]
 license = "MIT"

tuneapi/apis/__init__.py

Lines changed: 8 additions & 1 deletion
@@ -1,7 +1,14 @@
 # Copyright © 2024-2025 Frello Technology Private Limited
 
 # model APIs
-from tuneapi.apis.model_openai import Openai, TuneModel, Groq, Mistral, OpenAIProtocol
+from tuneapi.apis.model_openai import (
+    Openai,
+    TuneModel,
+    Groq,
+    Mistral,
+    Ollama,
+    OpenAIProtocol,
+)
 from tuneapi.apis.model_anthropic import Anthropic
 from tuneapi.apis.model_gemini import Gemini
 from tuneapi.apis.turbo import distributed_chat, distributed_chat_async

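The new Ollama export can then be imported alongside the other OpenAI-protocol clients. Its constructor is not part of this section of the diff, so the sketch below only shows the import path; the model name and the chat call via the shared OpenAIProtocol interface are assumptions:

import tuneapi.types as tt
from tuneapi.apis import Ollama

# model name and constructor arguments are assumptions;
# only the import path comes from this commit
model = Ollama("llama3.1")

out = model.chat(tt.Thread(tt.human("Say hi in five words")))
print(out)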
tuneapi/apis/model_anthropic.py

Lines changed: 164 additions & 28 deletions
@@ -7,7 +7,7 @@
 import httpx
 import requests
 from copy import deepcopy
-from typing import Optional, Dict, Any, List
+from typing import Optional, Dict, Any, List, Tuple
 
 import tuneapi.utils as tu
 import tuneapi.types as tt
@@ -24,35 +24,27 @@ def __init__(
     ):
         self.model_id = id
         self.base_url = base_url
+        self.batch_url = base_url + "/batches"
         self.api_token = api_token or tu.ENV.ANTHROPIC_TOKEN("")
         self.extra_headers = extra_headers
 
     def set_api_token(self, token: str) -> None:
         self.api_token = token
 
-    def _process_input(
-        self,
-        chats: tt.Thread | str,
-        model: Optional[str] = None,
-        max_tokens: int = 1024,
-        temperature: Optional[float] = None,
-        token: Optional[str] = None,
-        debug: bool = False,
-        extra_headers: Optional[Dict[str, str]] = None,
-        **kwargs,
-    ):
+    def _process_header(self, token: str) -> Dict[str, str]:
         if not token and not self.api_token:  # type: ignore
             raise Exception(
                 "Please set ANTHROPIC_TOKEN environment variable or pass through function"
             )
         token = token or self.api_token
-        if isinstance(chats, tt.Thread):
-            thread = chats
-        elif isinstance(chats, str):
-            thread = tt.Thread(tt.human(chats))
-        else:
-            raise Exception("Invalid input")
+        return {
+            "x-api-key": token,
+            "Content-Type": "application/json",
+            "anthropic-version": "2023-06-01",
+            "anthropic-beta": "tools-2024-05-16",
+        }
 
+    def _process_thread(self, thread: tt.Thread) -> Tuple[str, List[Dict[str, Any]]]:
         # create the anthropic style data
         system = ""
         if thread.chats[0].role == tt.Message.SYSTEM:
@@ -134,13 +126,29 @@ def _process_input(
             raise Exception(f"Unknown role: {m.role}")
         claude_messages.append(msg)
 
-        headers = {
-            "x-api-key": token,
-            "Content-Type": "application/json",
-            "anthropic-version": "2023-06-01",
-            "anthropic-beta": "tools-2024-05-16",
-        }
-        # return headers, system.strip(), claude_messages
+        return system, claude_messages
+
+    def _process_input(
+        self,
+        chats: tt.Thread | str,
+        model: Optional[str] = None,
+        max_tokens: int = 1024,
+        temperature: Optional[float] = None,
+        token: Optional[str] = None,
+        debug: bool = False,
+        extra_headers: Optional[Dict[str, str]] = None,
+        stream: bool = True,
+        **kwargs,
+    ):
+        if isinstance(chats, tt.Thread):
+            thread = chats
+        elif isinstance(chats, str):
+            thread = tt.Thread(tt.human(chats))
+        else:
+            raise Exception("Invalid input")
+
+        system, claude_messages = self._process_thread(thread)
+        headers = self._process_header(token)
 
         tools = []
         if isinstance(chats, tt.Thread) and chats.tools:
@@ -157,7 +165,7 @@ def _process_input(
             "messages": claude_messages,
             "system": system,
             "tools": tools,
-            "stream": True,
+            "stream": stream,
         }
         if temperature:
             data["temperature"] = temperature
@@ -274,7 +282,7 @@ def stream_chat(
         self,
         chats: tt.Thread | str,
         model: Optional[str] = None,
-        max_tokens: int = 1024,
+        max_tokens: int = 4096,
         temperature: Optional[float] = None,
         token: Optional[str] = None,
         debug: bool = False,
@@ -355,7 +363,7 @@ async def stream_chat_async(
         self,
         chats: tt.Thread | str,
         model: Optional[str] = None,
-        max_tokens: int = 1024,
+        max_tokens: int = 4096,
         temperature: Optional[float] = None,
         token: Optional[str] = None,
         debug: bool = False,
@@ -439,3 +447,131 @@ async def distributed_chat_async(
         debug=debug,
         **kwargs,
     )
+
+    def submit_batch(
+        self,
+        threads: List[tt.Thread | str],
+        model: Optional[str] = None,
+        max_tokens: int = 4096,
+        temperature: Optional[float] = None,
+        token: Optional[str] = None,
+        debug: bool = False,
+        extra_headers: Optional[Dict[str, str]] = None,
+        timeout=(5, 30),
+        raw: bool = False,
+        **kwargs,
+    ) -> Tuple[str, List[str]] | Dict:
+        bodies = []
+        custom_ids = []
+        for chats in threads:
+            headers, data = self._process_input(
+                chats=chats,
+                model=model,
+                max_tokens=max_tokens,
+                temperature=temperature,
+                token=token,
+                extra_headers=extra_headers,
+                stream=False,
+                **kwargs,
+            )
+            custom_id = "tuneapi_" + tu.get_random_string(10)
+            custom_ids.append(custom_id)
+            bodies.append({"custom_id": custom_id, "params": data})
+        body = {"requests": bodies}
+        if debug:
+            fp = "sample_anthropic_batch.json"
+            print("Saving at path " + fp)
+            tu.to_json(body, fp=fp)
+
+        r = requests.post(
+            url=self.batch_url,
+            headers=headers,
+            timeout=timeout,
+            json=body,
+        )
+        try:
+            r.raise_for_status()
+        except Exception as e:
+            tu.logger.error(f"Couldn't submit batch: {r.text}")
+            raise e
+        resp = r.json()
+
+        if raw:
+            return resp
+        return resp["id"], custom_ids
+
+    def get_batch(
+        self,
+        batch_id: str,
+        custom_ids: Optional[List[str]] = None,
+        usage: bool = False,
+        token: Optional[str] = None,
+        raw: bool = False,
+        verbose: bool = False,
+    ) -> Tuple[List[Any] | Dict, str | None]:
+        headers = self._process_header(token)
+        r = requests.get(self.batch_url + "/" + batch_id, headers=headers)
+        try:
+            r.raise_for_status()
+        except Exception as e:
+            tu.logger.error(f"Couldn't get batch: {r.text}")
+            raise e
+        resp = r.json()
+        if resp["processing_status"] != "ended":
+            if verbose:
+                tu.logger.info(
+                    f"Batch {batch_id} has not ended. Status: {resp['processing_status']}"
+                )
+            return None, resp["processing_status"]
+        results_url = resp["results_url"]
+
+        # fetch the results; the response is JSONL, and the function returns a list of JSON objects
+        r = requests.get(results_url, headers=headers)
+        try:
+            r.raise_for_status()
+        except Exception as e:
+            tu.logger.error(f"Couldn't get batch results: {r.text}")
+            raise e
+
+        output = []
+        for line in r.iter_lines():
+            if not line:
+                continue
+            output.append(tu.from_json(line))
+
+        if custom_ids:
+            # each item in output has a "custom_id" key; sort by the order of the incoming custom_ids
+            output = sorted(output, key=lambda x: custom_ids.index(x["custom_id"]))
+
+        if raw:
+            return output, None
+
+        _usage = tt.Usage(0, 0)
+        for o in output:
+            u = o["result"]["message"]["usage"]
+            _usage += tt.Usage(
+                input_tokens=u.pop("input_tokens"),
+                output_tokens=u.pop("output_tokens"),
+                cached_tokens=u.get("cache_read_input_tokens", 0)
+                or u.get("cache_creation_input_tokens", 0),
+                **u,
+            )
+
+        parsed_output = [o["result"]["message"]["content"][0] for o in output]
+        final_output = []
+        for o in parsed_output:
+            if o["type"] == "text":
+                final_output.append(o["text"])
+            elif o["type"] == "tool_use":
+                final_output.append(
+                    {
+                        "name": o["name"],
+                        "arguments": o["input"],
+                    }
+                )
+            else:
+                raise ValueError(f"Unknown message content: {o['type']}")
+
+        if usage:
+            return final_output, None, _usage
+        return final_output, None

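Per the get_batch implementation above, the call returns (None, processing_status) until Anthropic reports the batch as "ended", so callers are expected to poll. A sketch of that loop follows; the model construction, prompt, and sleep interval are assumptions for illustration:

import time
import tuneapi.types as tt
from tuneapi.apis import Anthropic

model = Anthropic("claude-3-5-sonnet-20241022")  # constructor args assumed

batch_id, custom_ids = model.submit_batch(
    [tt.Thread(tt.human("Write a haiku about retries"))]
)

# poll until processing_status == "ended"; results stays None until then
results, status = model.get_batch(batch_id, custom_ids=custom_ids)
while results is None:
    time.sleep(30)
    results, status = model.get_batch(batch_id, custom_ids=custom_ids)

# results is a list: plain strings for text blocks and
# {"name": ..., "arguments": ...} dicts for tool_use blocks
for item in results:
    print(item)

With usage=True, get_batch additionally returns the accumulated tt.Usage as a third element.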