added support for groq

splitbrain · splitbrain · commit 074b7701298b · 2024-04-22T18:26:23.000+02:00
diff --git a/Model/Groq/ChatModel.php b/Model/Groq/ChatModel.php
@@ -0,0 +1,65 @@
+<?php
+
+namespace dokuwiki\plugin\aichat\Model\Groq;
+
+use dokuwiki\plugin\aichat\Model\AbstractModel;
+use dokuwiki\plugin\aichat\Model\ChatInterface;
+
+class ChatModel extends AbstractModel implements ChatInterface
+{
+    /** @inheritdoc */
+    public function __construct(string $name, array $config)
+    {
+        parent::__construct($name, $config);
+
+        if (empty($config['groq_apikey'])) {
+            throw new \Exception('Groq API key not configured');
+        }
+        // the key is passed as Bearer token in the Authorization header of the HTTP client
+        $this->http->headers['Authorization'] = 'Bearer '.$config['groq_apikey'];
+    }
+
+    /** @inheritdoc */
+    public function getAnswer(array $messages): string
+    {
+        $data = [
+            'messages' => $messages,
+            'model' => $this->getModelName(),
+            'max_tokens' => null,
+            'stream' => false,
+            'n' => 1, // number of completions
+            'temperature' => 0.0,
+        ];
+        $response = $this->request('chat/completions', $data);
+        return $response['choices'][0]['message']['content'];
+    }
+
+    /**
+     * Send a POST request to the Groq API
+     *
+     * @param string $endpoint Path below https://api.groq.com/openai/v1/, e.g. chat/completions
+     * @param array $data Payload to send
+     * @return array API response
+     * @throws \Exception
+     */
+    protected function request($endpoint, $data)
+    {
+        $url = 'https://api.groq.com/openai/v1/' . $endpoint;
+        return $this->sendAPIRequest('POST', $url, $data);
+    }
+
+    /** @inheritdoc */
+    protected function parseAPIResponse($response)
+    {
+        if (isset($response['usage'])) {
+            $this->inputTokensUsed += $response['usage']['prompt_tokens'] ?? 0;
+            $this->outputTokensUsed += $response['usage']['completion_tokens'] ?? 0;
+        }
+        // errors reported in the response body are turned into exceptions
+        if (isset($response['error'])) {
+            throw new \Exception('Groq API error: ' . $response['error']['message']);
+        }
+
+        return $response;
+    }
+}
diff --git a/Model/Groq/models.json b/Model/Groq/models.json
@@ -0,0 +1,39 @@
+{
+    "chat": {
+        "llama3-8b-8192": {
+            "description": "LLaMA3 8b",
+            "inputTokens": 8192,
+            "inputTokenPrice": 0,
+            "outputTokens": 8192,
+            "outputTokenPrice": 0
+        },
+        "llama3-70b-8192": {
+            "description": "LLaMA3 70b",
+            "inputTokens": 8192,
+            "inputTokenPrice": 0,
+            "outputTokens": 8192,
+            "outputTokenPrice": 0
+        },
+        "llama2-70b-4096": {
+            "description": "LLaMA2 70b",
+            "inputTokens": 4096,
+            "inputTokenPrice": 0,
+            "outputTokens": 4096,
+            "outputTokenPrice": 0
+        },
+        "mixtral-8x7b-32768": {
+            "description": "Mixtral 8x7b",
+            "inputTokens": 32768,
+            "inputTokenPrice": 0,
+            "outputTokens": 32768,
+            "outputTokenPrice": 0
+        },
+        "gemma-7b-it": {
+            "description": "Gemma is a family of lightweight, state-of-the-art open models from Google, built from the same research and technology used to create the Gemini models. They are text-to-text, decoder-only large language models, available in English, with open weights, pre-trained variants, and instruction-tuned variants. Gemma models are well-suited for a variety of text generation tasks, including question answering, summarization, and reasoning. Their relatively small size makes it possible to deploy them in environments with limited resources such as a laptop, desktop or your own cloud infrastructure, democratizing access to state of the art AI models and helping foster innovation for everyone.",
+            "inputTokens": 8192,
+            "inputTokenPrice": 0,
+            "outputTokens": 8192,
+            "outputTokenPrice": 0
+        }
+    }
+}
diff --git a/Model/Ollama/AbstractOllama.php b/Model/Ollama/AbstractOllama.php
@@ -0,0 +1,55 @@
+<?php
+
+namespace dokuwiki\plugin\aichat\Model\Ollama;
+
+use dokuwiki\plugin\aichat\Model\AbstractModel;
+
+/**
+ * Abstract Ollama Model
+ *
+ * This class provides a basic interface to the Ollama API
+ */
+abstract class AbstractOllama extends AbstractModel
+{
+    /** @var string API base URL, always replaced by the configured ollama_baseurl in the constructor */
+    protected $apiurl = 'http://localhost:11434/api/';
+
+    /** @inheritdoc */
+    public function __construct(string $name, array $config)
+    {
+        parent::__construct($name, $config);
+        $this->apiurl = rtrim($config['ollama_baseurl'] ?? '', '/');
+        if ($this->apiurl === '') {
+            throw new \Exception('Ollama base URL not configured');
+        }
+    }
+
+    /**
+     * Send a request to the Ollama API
+     *
+     * @param string $endpoint Path relative to the configured base URL
+     * @param array $data Payload to send
+     * @return array API response
+     * @throws \Exception
+     */
+    protected function request($endpoint, $data)
+    {
+        $url = $this->apiurl . '/' . ltrim($endpoint, '/');
+        return $this->sendAPIRequest('POST', $url, $data);
+    }
+
+    /** @inheritdoc */
+    protected function parseAPIResponse($response)
+    {
+        // Ollama reports prompt tokens as prompt_eval_count and generated tokens as eval_count
+        $this->inputTokensUsed += $response['prompt_eval_count'] ?? 0;
+        $this->outputTokensUsed += $response['eval_count'] ?? 0;
+
+        if (isset($response['error'])) {
+            $error = is_array($response['error']) ? $response['error']['message'] : $response['error'];
+            throw new \Exception('Ollama API error: ' . $error);
+        }
+
+        return $response;
+    }
+}
diff --git a/Model/Ollama/ChatModel.php b/Model/Ollama/ChatModel.php
@@ -0,0 +1,20 @@
+<?php
+
+namespace dokuwiki\plugin\aichat\Model\Ollama;
+
+use dokuwiki\plugin\aichat\Model\ChatInterface;
+
+class ChatModel extends AbstractOllama implements ChatInterface
+{
+    /** @inheritdoc */
+    public function getAnswer(array $messages): string
+    {
+        $payload = [];
+        $payload['messages'] = $messages;
+        $payload['model'] = $this->getModelName();
+        $payload['stream'] = false; // streaming is disabled
+
+        $reply = $this->request('chat', $payload);
+        return $reply['message']['content'];
+    }
+}
diff --git a/Model/Ollama/EmbeddingModel.php b/Model/Ollama/EmbeddingModel.php
@@ -0,0 +1,20 @@
+<?php
+
+namespace dokuwiki\plugin\aichat\Model\Ollama;
+
+use dokuwiki\plugin\aichat\Model\EmbeddingInterface;
+
+class EmbeddingModel extends AbstractOllama implements EmbeddingInterface
+{
+    /** @inheritdoc */
+    public function getEmbedding($text): array
+    {
+        // the text to embed is sent as "prompt" together with the model name
+        $payload = ['model' => $this->getModelName(), 'prompt' => $text];
+
+        $result = $this->request('embeddings', $payload);
+        $vector = $result['embedding'];
+
+        return $vector;
+    }
+}
diff --git a/Model/Ollama/models.json b/Model/Ollama/models.json
@@ -0,0 +1,27 @@
+{
+    "chat": {
+        "llama2": {
+            "description": "Llama 2 is released by Meta Platforms, Inc. This model is trained on 2 trillion tokens, and by default supports a context length of 4096. Llama 2 Chat models are fine-tuned on over 1 million human annotations, and are made for chat.",
+            "inputTokens": 4096,
+            "inputTokenPrice": 0,
+            "outputTokens": 4096,
+            "outputTokenPrice": 0
+        },
+
+        "gemma": {
+            "description": "Gemma is a family of lightweight, state-of-the-art open models from Google, built from the same research and technology used to create the Gemini models.",
+            "inputTokens": 4096,
+            "inputTokenPrice": 0,
+            "outputTokens": 4096,
+            "outputTokenPrice": 0
+        }
+    },
+    "embedding": {
+        "text-embedding-ada-002": {
+            "description": "Most capable 2nd generation embedding model",
+            "inputTokens": 8192,
+            "inputTokenPrice": 0.10,
+            "dimensions": 1536
+        }
+    }
+}
diff --git a/conf/default.php b/conf/default.php
@@ -22,6 +22,8 @@
 
 $conf['reka_apikey'] = '';
 
+$conf['groq_apikey'] = '';
+
 $conf['pinecone_apikey'] = '';
 $conf['pinecone_baseurl'] = '';
 
diff --git a/conf/metadata.php b/conf/metadata.php
@@ -29,6 +29,8 @@
 
 $meta['reka_apikey'] = array('password');
 
+$meta['groq_apikey'] = array('password');
+
 $meta['pinecone_apikey'] = array('password');
 $meta['pinecone_baseurl'] = array('string');
 
diff --git a/lang/en/settings.php b/lang/en/settings.php
@@ -18,6 +18,7 @@
 $lang['mistral_apikey'] = '🧠 <b>Mistral</b> API key';
 $lang['voyageai_apikey'] = '🧠 <b>Voyage AI</b> API key';
 $lang['reka_apikey'] = '🧠 <b>Reka</b> API key';
+$lang['groq_apikey'] = '🧠 <b>Groq</b> API key';
 
 $lang['pinecone_apikey'] = '📥 <b>Pinecone</b> API key';
 $lang['pinecone_baseurl'] = '📥 <b>Pinecone</b> base URL';