Add gpt4all provider - offline

Simatwa · Simatwa · commit 61af2712f189 · 2024-02-09T04:19:34.000+03:00
diff --git a/docs/CHANGELOG.md b/docs/CHANGELOG.md
@@ -360,4 +360,10 @@ For instance:
 
 - Execute python code in responses *(interactive)*- `exec`
 - Execute python codes using system installed python interpreter - *default*
-- Other minor fixes.
+- Other minor fixes.
+
+## v0.4.5
+
+**What's new?**
+
+- New provider: **GPT4ALL** - adds support for offline LLMs.
diff --git a/docs/README.md b/docs/README.md
@@ -44,6 +44,7 @@ This project enables seamless interaction with over **45 free LLM providers** wi
 
 The name *python-tgpt* draws inspiration from its parent project [tgpt](https://github.com/aandrew-me/tgpt), which operates on [Golang](https://go.dev/). Through this Python adaptation, users can effortlessly engage with a number of free LLMs available, fostering a smoother AI interaction experience.
 
+
 ### Features
 
 - 🗨️ Enhanced conversational chat experience
@@ -57,6 +58,7 @@ The name *python-tgpt* draws inspiration from its parent project [tgpt](https://
 - 🤖 Pass [awesome-chatgpt prompts](https://github.com/f/awesome-chatgpt-prompts) easily
 - 🧠 Multiple LLM providers - **45+**
 - 🎯 Customizable script generation and execution
+- 🔌 Offline support for Large Language Models
 
 ## Providers
 
@@ -71,6 +73,7 @@ These are simply the hosts of the LLMs, which include:
 9. [Phind](https://www.phind.com) - *default*
 10. [Llama2](https://www.llama2.ai)
 11. [Blackboxai](https://www.blackbox.ai)
+12. [gpt4all](https://gpt4all.io) *(Offline)*
 
 <details>
 
diff --git a/requirements.txt b/requirements.txt
@@ -10,3 +10,4 @@ colorama==0.4.6
 g4f>=0.2.1.0
 pyyaml==6.0.1
 matplotlib
+gpt4all==2.2.0
diff --git a/setup.py b/setup.py
@@ -9,6 +9,7 @@
     "requests==2.28.2",
     "appdirs==1.4.4",
     "pyyaml==6.0.1",
+    "gpt4all==2.2.0",
 ]
 
 cli_reqs = [
@@ -36,7 +37,7 @@
 
 setup(
     name="python-tgpt",
-    version="0.4.4",
+    version="0.4.5",
     license="MIT",
     author="Smartwa",
     maintainer="Smartwa",
@@ -78,6 +79,8 @@
         "openai",
         "bard",
         "gpt4free",
+        "gpt4all-cli",
+        "gptcli",
     ],
     long_description=Path.open("README.md", encoding="utf-8").read(),
     long_description_content_type="text/markdown",
diff --git a/src/pytgpt/__init__.py b/src/pytgpt/__init__.py
@@ -1,7 +1,7 @@
 from .utils import appdir
 import g4f
 
-__version__ = "0.4.4"
+__version__ = "0.4.5"
 __author__ = "Smartwa"
 __repo__ = "https://github.com/Simatwa/python-tgpt"
 
@@ -14,6 +14,7 @@
     "phind",
     "llama2",
     "blackboxai",
+    "gpt4all",
 ]
 
 gpt4free_providers = [
diff --git a/src/pytgpt/console.py b/src/pytgpt/console.py
@@ -498,6 +498,26 @@ def __init__(
                     act=awesome_prompt,
                 )
 
+            elif provider == "gpt4all":
+                from pytgpt.gpt4all import GPT4ALL
+
+                assert (
+                    auth
+                ), f"Path to LLM (.gguf or .bin) file is required. Use the flag `--key` or `-k`"
+                self.bot = GPT4ALL(
+                    model=auth,
+                    is_conversation=disable_conversation,
+                    max_tokens=max_tokens,
+                    temperature=temperature,
+                    presence_penalty=top_p,
+                    frequency_penalty=top_k,
+                    top_p=top_p,
+                    intro=intro,
+                    filepath=filepath,
+                    update_file=update_file,
+                    history_offset=history_offset,
+                )
+
             elif provider in pytgpt.gpt4free_providers:
                 from pytgpt.gpt4free import GPT4FREE
 
@@ -1037,7 +1057,7 @@ class ChatInteractive:
         "-k",
         "--key",
         envvar="auth_key",
-        help="LLM API access key or auth value",
+        help="LLM API access key or auth value or path to LLM with provider.",
     )
     @click.option(
         "-ct",
@@ -1314,7 +1334,7 @@ class ChatGenerate:
         "-k",
         "--key",
         envvar="auth_key",
-        help="LLM API access key or auth value",
+        help="LLM API access key or auth value or path to LLM with provider.",
     )
     @click.option(
         "-ct",
diff --git a/src/pytgpt/gpt4all/__init__.py b/src/pytgpt/gpt4all/__init__.py
@@ -0,0 +1,7 @@
+from .main import GPT4ALL
+
+__info__ = "Interact with offline models"  # one-line summary of this package
+
+__all__ = [  # names exported by `from pytgpt.gpt4all import *`
+    "GPT4ALL",
+]
diff --git a/src/pytgpt/gpt4all/main.py b/src/pytgpt/gpt4all/main.py
@@ -0,0 +1,206 @@
+from pytgpt.utils import Optimizers
+from pytgpt.utils import Conversation
+from pytgpt.utils import AwesomePrompts
+from pytgpt.base import Provider
+from gpt4all import GPT4All
+from gpt4all.gpt4all import empty_chat_session
+from gpt4all.gpt4all import append_extension_if_missing
+
+
+import logging
+
+my_logger = logging.getLogger("gpt4all")  # presumably the gpt4all library's logger - confirm
+my_logger.setLevel(logging.CRITICAL)  # records below CRITICAL on this logger are dropped
+
+
+class GPT4ALL(Provider):
+    def __init__(
+        self,
+        model: str,
+        is_conversation: bool = True,
+        max_tokens: int = 800,
+        temperature: float = 0.7,
+        presence_penalty: int = 0,
+        frequency_penalty: int = 1.18,
+        top_p: float = 0.4,
+        intro: str = None,
+        filepath: str = None,
+        update_file: bool = True,
+        history_offset: int = 10250,
+        act: str = None,
+    ):
+        """Instantiates GPT4ALL
+
+        Args:
+            model (str, optional): Path to LLM model (.gguf or .bin).
+            is_conversation (bool, optional): Flag for chatting conversationally. Defaults to True.
+            max_tokens (int, optional): Maximum number of tokens to be generated upon completion. Defaults to 800.
+            temperature (float, optional): Charge of the generated text's randomness. Defaults to 0.7.
+            presence_penalty (int, optional): Chances of topic being repeated. Defaults to 0.
+            frequency_penalty (int, optional): Chances of word being repeated. Defaults to 1.18.
+            top_p (float, optional): Sampling threshold during inference time. Defaults to 0.4.
+            intro (str, optional): Conversation introductory prompt. Defaults to None.
+            filepath (str, optional): Path to file containing conversation history. Defaults to None.
+            update_file (bool, optional): Add new prompts and responses to the file. Defaults to True.
+            history_offset (int, optional): Limit conversation history to this number of last texts. Defaults to 10250.
+            act (str|int, optional): Awesome prompt key or index. (Used as intro). Defaults to None.
+        """
+        self.is_conversation = is_conversation
+        self.max_tokens_to_sample = max_tokens
+        self.model = model
+        self.temperature = temperature
+        self.presence_penalty = presence_penalty
+        self.frequency_penalty = frequency_penalty
+        self.top_p = top_p
+        self.last_response = {}
+
+        self.__available_optimizers = (
+            method
+            for method in dir(Optimizers)
+            if callable(getattr(Optimizers, method)) and not method.startswith("__")
+        )
+        Conversation.intro = (
+            AwesomePrompts().get_act(
+                act, raise_not_found=True, default=None, case_insensitive=True
+            )
+            if act
+            else intro or Conversation.intro
+        )
+        self.conversation = Conversation(
+            is_conversation, self.max_tokens_to_sample, filepath, update_file
+        )
+        self.conversation.history_offset = history_offset
+
+        def get_model_name_path():
+            import os
+            from pathlib import Path
+
+            initial_model_path = Path(append_extension_if_missing(model))
+            if initial_model_path.exists:
+                if not initial_model_path.is_absolute():
+                    initial_model_path = Path(os.getcwd()) / initial_model_path
+                return os.path.split(initial_model_path.as_posix())
+            else:
+                raise FileNotFoundError(
+                    "File does not exist " + initial_model_path.as_posix()
+                )
+
+        model_dir, model_name = get_model_name_path()
+
+        self.gpt4all = GPT4All(
+            model_name=model_name,
+            model_path=model_dir,
+            allow_download=False,
+            verbose=False,
+        )
+
+    def ask(
+        self,
+        prompt: str,
+        stream: bool = False,
+        raw: bool = False,
+        optimizer: str = None,
+        conversationally: bool = False,
+    ) -> dict:
+        """Chat with AI
+
+        Args:
+            prompt (str): Prompt to be send.
+            stream (bool, optional): Flag for streaming response. Defaults to False.
+            raw (bool, optional): Stream back raw response as received. Defaults to False.
+            optimizer (str, optional): Prompt optimizer name - `[code, shell_command]`. Defaults to None.
+            conversationally (bool, optional): Chat conversationally when using optimizer. Defaults to False.
+        Returns:
+           dict : {}
+        ```json
+        {
+           "text" : "How may I help you today?"
+        }
+        ```
+        """
+        conversation_prompt = self.conversation.gen_complete_prompt(prompt)
+        if optimizer:
+            if optimizer in self.__available_optimizers:
+                conversation_prompt = getattr(Optimizers, optimizer)(
+                    conversation_prompt if conversationally else prompt
+                )
+            else:
+                raise Exception(
+                    f"Optimizer is not one of {self.__available_optimizers}"
+                )
+
+        def for_stream():
+            response = self.gpt4all.generate(
+                prompt=conversation_prompt,
+                max_tokens=self.max_tokens_to_sample,
+                temp=self.temperature,
+                top_p=self.top_p,
+                repeat_penalty=self.frequency_penalty,
+                streaming=True,
+            )
+
+            message_load: str = ""
+            for token in response:
+                message_load += token
+                resp: dict = dict(text=message_load)
+                yield token if raw else resp
+                self.last_response.update(resp)
+
+            self.conversation.update_chat_history(
+                prompt, self.get_message(self.last_response)
+            )
+            self.gpt4all.current_chat_session = empty_chat_session()
+
+        def for_non_stream():
+            for _ in for_stream():
+                pass
+            return self.last_response
+
+        return for_stream() if stream else for_non_stream()
+
+    def chat(
+        self,
+        prompt: str,
+        stream: bool = False,
+        optimizer: str = None,
+        conversationally: bool = False,
+    ) -> str:
+        """Generate response `str`
+        Args:
+            prompt (str): Prompt to be send.
+            stream (bool, optional): Flag for streaming response. Defaults to False.
+            optimizer (str, optional): Prompt optimizer name - `[code, shell_command]`. Defaults to None.
+            conversationally (bool, optional): Chat conversationally when using optimizer. Defaults to False.
+        Returns:
+            str: Response generated
+        """
+
+        def for_stream():
+            for response in self.ask(
+                prompt, True, optimizer=optimizer, conversationally=conversationally
+            ):
+                yield self.get_message(response)
+
+        def for_non_stream():
+            return self.get_message(
+                self.ask(
+                    prompt,
+                    False,
+                    optimizer=optimizer,
+                    conversationally=conversationally,
+                )
+            )
+
+        return for_stream() if stream else for_non_stream()
+
+    def get_message(self, response: dict) -> str:
+        """Retrieves message only from response
+
+        Args:
+            response (str): Response generated by `self.ask`
+
+        Returns:
+            str: Message extracted
+        """
+        assert isinstance(response, dict), "Response should be of dict data-type only"
+        return response["text"]