-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathchat_ui_gradio.py
More file actions
150 lines (124 loc) · 4.91 KB
/
chat_ui_gradio.py
File metadata and controls
150 lines (124 loc) · 4.91 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
import gradio as gr
import os
from langchain_openai import ChatOpenAI
import requests
from bs4 import BeautifulSoup
import re
import chromadb
import uuid
# Initialize Chroma
# Persistent vector store on local disk; the collection holds free-text
# "memories" that are embedded and retrieved by semantic similarity.
client = chromadb.PersistentClient(path="./chroma_db")
collection = client.get_or_create_collection(name="engineering_memory")
# LM Studio connection
# host.docker.internal lets a containerized app reach LM Studio running on
# the host machine; LM_STUDIO_URL overrides it for other deployments.
LM_STUDIO_URL = os.getenv("LM_STUDIO_URL", "http://host.docker.internal:1234")
llm = ChatOpenAI(
    base_url=f"{LM_STUDIO_URL}/v1",
    api_key="not-needed",  # LM Studio's local OpenAI-compatible server ignores the key
    model="local-model"
)
# Memory functions
def add_memory(text):
    """Persist one piece of text into the Chroma memory collection.

    Returns a short status string for display in the UI; rejects
    blank/whitespace-only input without touching the collection.
    """
    if not text.strip():
        return "Please enter some text to save."
    # A random UUID keeps every saved memory unique, so repeated saves
    # of the same text never collide on id.
    collection.add(documents=[text], ids=[str(uuid.uuid4())])
    return f"✓ Memory saved: {text[:50]}..."
def search_memory(query, n_results=3):
    """Semantic search over stored memories, formatted as Markdown bullets."""
    if not query.strip():
        return "Please enter a search query."
    # query_texts takes a batch; we send one query, so read result slot 0.
    hits = collection.query(query_texts=[query], n_results=n_results)['documents'][0]
    if not hits:
        return "No memories found."
    found = "\n".join(f"• {mem}" for mem in hits)
    return f"**Found memories:**\n{found}"
# Web fetching function
def fetch_webpage(url: str) -> str:
    """Fetch a webpage and return up to 3000 chars of its visible text.

    Accepts either a bare URL or arbitrary text containing one; the first
    http(s) URL found is fetched. Never raises — on any failure (network,
    HTTP error status, parse) an "Error fetching webpage: ..." string is
    returned so the caller can surface it directly in the chat.
    """
    url = url.strip()
    # Extract the first URL in case surrounding text was passed in.
    url_match = re.search(r'https?://[^\s\'"}\]]+', url)
    if url_match:
        url = url_match.group(0)
    try:
        response = requests.get(url, timeout=10, headers={'User-Agent': 'Mozilla/5.0'})
        # Fail fast on 4xx/5xx instead of silently parsing an error page
        # and feeding it to the LLM as if it were real content.
        response.raise_for_status()
        soup = BeautifulSoup(response.content, 'html.parser')
        # Remove non-visible elements before extracting text.
        for script in soup(["script", "style"]):
            script.decompose()
        text = soup.get_text()
        # Strip per-line whitespace and drop blank lines.
        lines = (line.strip() for line in text.splitlines())
        text = '\n'.join(line for line in lines if line)
        # Cap the excerpt so it fits comfortably into the LLM prompt.
        return text[:3000] if text else "No content found"
    except Exception as e:
        return f"Error fetching webpage: {str(e)}"
def respond(message, chat_history):
    """Gradio chat handler: answer *message* using stored memories, recent
    history and — when the message contains a URL — the fetched page text.

    Appends [message, reply] to chat_history in place and returns
    ("", chat_history) so Gradio clears the input box and refreshes the chat.
    """
    # Pull up to 3 semantically similar memories. Guard with .get/fallback
    # so an empty or missing 'documents' structure cannot raise IndexError.
    result = collection.query(query_texts=[message], n_results=3)
    docs = result.get('documents') or [[]]
    memories = docs[0] or []

    # Include only the last 5 exchanges to keep the prompt small.
    conversation = ""
    if chat_history:
        for user_msg, bot_msg in chat_history[-5:]:
            conversation += f"User: {user_msg}\nAssistant: {bot_msg}\n\n"

    # Assemble the prompt: memories first, then history, then the message.
    full_prompt = ""
    if memories:
        context = "\n".join(f"- {mem}" for mem in memories)
        full_prompt += f"Relevant knowledge from memory:\n{context}\n\n"
    if conversation:
        full_prompt += f"Recent conversation:\n{conversation}\n"
    full_prompt += f"User: {message}"

    # If the user pasted a URL, append the fetched page text as context.
    url_match = re.search(r'https?://[^\s]+', message)
    if url_match:
        url = url_match.group(0)
        webpage_content = fetch_webpage(url)
        full_prompt += f"\n\nWebpage content from {url}:\n{webpage_content}"

    try:
        bot_message = llm.invoke(full_prompt).content
    except Exception as e:
        # Surface LLM/connection failures in the chat instead of crashing.
        bot_message = f"Error: {str(e)}"

    chat_history.append([message, bot_message])
    return "", chat_history
# Build Gradio interface
# Two-column layout: chat on the left, memory management panel on the right.
# NOTE(review): source indentation was lost in extraction; nesting below is
# reconstructed from gradio Blocks semantics — confirm against the original.
with gr.Blocks(title="Local LLM Chat") as demo:
    gr.Markdown("# 🤖 Local LLM Chat with Memory & Web Access")
    with gr.Row():
        # Left column (wider): the chat itself plus the input row.
        with gr.Column(scale=3):
            chatbot = gr.Chatbot(value=[], height=600)
            with gr.Row():
                msg = gr.Textbox(
                    placeholder="Ask me anything (include URLs to fetch webpages)...",
                    show_label=False,
                    scale=9
                )
                submit = gr.Button("Send", scale=1, variant="primary")
        # Right column (narrower): save and search memory controls.
        with gr.Column(scale=1):
            gr.Markdown("### Memory Management")
            with gr.Group():
                gr.Markdown("**Add to memory:**")
                memory_input = gr.Textbox(
                    placeholder="Enter information to remember...",
                    show_label=False,
                    lines=3
                )
                save_btn = gr.Button("Save Memory", variant="primary")
                memory_status = gr.Markdown()
            gr.Markdown("---")
            with gr.Group():
                gr.Markdown("**Search memories:**")
                search_input = gr.Textbox(
                    placeholder="Search...",
                    show_label=False
                )
                search_btn = gr.Button("Search")
                search_results = gr.Markdown()
    # Event handlers
    # Enter key and the Send button both route through respond().
    msg.submit(respond, [msg, chatbot], [msg, chatbot])
    submit.click(respond, [msg, chatbot], [msg, chatbot])
    # Saving a memory shows a status message; a second handler on the same
    # click clears the input textbox.
    save_btn.click(add_memory, [memory_input], [memory_status])
    save_btn.click(lambda: "", None, [memory_input])
    search_btn.click(search_memory, [search_input], [search_results])
if __name__ == "__main__":
    # Bind to all interfaces so the app is reachable from outside a container.
    demo.launch(server_name="0.0.0.0", server_port=7860)