33from sklearn .decomposition import TruncatedSVD
44from utils import *
55import matplotlib .pyplot as plt
6+ import matplotlib
7+ matplotlib .use ('QtAgg' )
68
79class AI (object ):
8- def __init__ (self , OPENAI_API_KEY , model_type ):
10+ def __init__ (self , OPENAI_API_KEY , model_type , llm_model ):
911 # Initialize OpenAI client and model
10- self .client , self .model = initialize_openai_and_embedding (OPENAI_API_KEY , model_type )
11-
12+ self .client , self .model = initialize_openai_and_embedding (OPENAI_API_KEY , model_type , llm_model )
13+ self .llm_model = llm_model
14+
1215 def content_embedding (self , content ):
1316 return self .model .encode (content ).tolist ()
1417
1518 def clustering (self , allowed_type , txt_files , pdf_files , docx_files , num_clusters ):
1619 # Clustering logic
1720 contents = []
21+ C_path = []
1822 if allowed_type == "txt" or allowed_type == "all" :
1923 for file in txt_files :
2024 with open (file , 'r' , encoding = 'utf-8' ) as f :
2125 contents .append (f .read ())
26+ C_path .append (basename (file ))
2227
2328 if allowed_type == "pdf" or allowed_type == "all" :
2429 for file in pdf_files :
2530 try :
2631 pdf_text = read_pdf (file )
2732 contents .append (pdf_text )
33+ C_path .append (basename (file ))
2834 except Exception as e :
2935 write_log (f"Warning: Error reading PDF file: { e } " )
3036
@@ -33,6 +39,7 @@ def clustering(self, allowed_type, txt_files, pdf_files, docx_files, num_cluster
3339 try :
3440 docx_text = read_docx (file )
3541 contents .append (docx_text )
42+ C_path .append (basename (file ))
3643 except Exception as e :
3744 write_log (f"Warning: Error reading DOCX file: { e } " )
3845
@@ -51,12 +58,9 @@ def clustering(self, allowed_type, txt_files, pdf_files, docx_files, num_cluster
5158 for i in range (num_clusters ):
5259 plt .scatter (X_svd [y_kmeans == i , 0 ], X_svd [y_kmeans == i , 1 ], label = f'Cluster { i + 1 } ' )
5360
54- '''for i, txt_file in enumerate(txt_files + pdf_files):
55- plt.annotate(basename(txt_file), (X_svd[i, 0], X_svd[i, 1]))'''
56-
57- for i in range (len (X_svd )):
58- plt .annotate (basename (txt_files [i % len (txt_files )]), (X_svd [i , 0 ], X_svd [i , 1 ])) # Use modulo operator to loop over txt_files
59-
61+ for i in range (len (contents )):
62+ plt .annotate (C_path [i ], (X_svd [i , 0 ], X_svd [i , 1 ]))
63+
6064 plt .title ('Clustering of Text Files Content' )
6165 plt .xlabel ('Feature 1' )
6266 plt .ylabel ('Feature 2' )
@@ -94,18 +98,22 @@ def keyword_search(self, allowed_type, txt_files, pdf_files, docx_files, keyword
9498
9599 return results
96100
97- def chat_interaction (self , openaiclient , msg , selected_note_files , chat_history ):
101+ def chat_interaction (self , msg , selected_note_files , chat_history ):
98102 # Chat interaction logic
99103 notes_text = ""
100104 for file in selected_note_files :
101105 with open (file , 'r' , encoding = 'utf-8' ) as f :
102106 notes_text += f .read () + "\n "
103-
104- response = openaiclient .chat .completions .create (
105- model = "gpt-3.5-turbo" ,
106- messages = [
107- {"role" : "system" , "content" : "Answer the users question based on the notes.(answer only one sentence(15-20 words))" },
108- {"role" : "user" , "content" : f"Notes: \n { notes_text } " }] + chat_history + [{"role" : "user" , "content" : msg }], max_tokens = 41 )
109-
110- chatbot_response = response .choices [0 ].message .content .strip ()
111- return chatbot_response
107+ if self .llm_model in ["Tinyllama(Q5)" , "Llama2-7B(Q4)" ]:
108+ history_str = '\n ' .join ([f"{ c ['role' ]} : { c ['content' ]} " for c in chat_history ])
109+ prompt = f"""Answer the user question based on the following notes.(answer max one sentence(15-20 words)\n \n Notes: \n { notes_text } \n \n { history_str } \n user: { msg } \n assistant: """
110+ chatbot_response = self .client (prompt , temperature = 0.7 , max_new_tokens = 41 , stop = ['assistant:' ,'user:' ], threads = 4 )
111+ else :
112+ response = self .client .chat .completions .create (
113+ model = "gpt-3.5-turbo" ,
114+ messages = [
115+ {"role" : "system" , "content" : "Answer the user question based on the notes.(answer max one sentence(15-20 words)" },
116+ {"role" : "user" , "content" : f"Notes: \n { notes_text } " }] + chat_history + [{"role" : "user" , "content" : msg }], max_tokens = 41 )
117+
118+ chatbot_response = response .choices [0 ].message .content
119+ return chatbot_response .strip ()
# 0 commit comments