-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathqa_system.py
More file actions
257 lines (222 loc) · 10.4 KB
/
qa_system.py
File metadata and controls
257 lines (222 loc) · 10.4 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
import os
import json
import numpy as np
import requests
from dotenv import load_dotenv
from sqlalchemy import create_engine
from sqlalchemy.orm import sessionmaker
from models import Base, PDFFile, PDFEmbedding
from rich.console import Console
from rich.panel import Panel
from rich.markdown import Markdown
# Initialize Rich console (shared by every function below for terminal output)
console = Console()
# Load environment variables from a local .env file into the process environment
load_dotenv()
# Database configuration -- every value is read from the environment.
# NOTE(review): os.getenv returns None for any missing variable, which would
# produce a malformed DATABASE_URL below; no validation is performed here.
DB_USER = os.getenv('DB_USER')
DB_PASSWORD = os.getenv('DB_PASSWORD')
DB_HOST = os.getenv('DB_HOST')
DB_PORT = os.getenv('DB_PORT')
DB_NAME = os.getenv('DB_NAME')
# AI API configuration: separate endpoint/model pairs for embeddings vs. chat QA
EMBEDDING_API_URL = os.getenv('AI_API_URL')
EMBEDDING_MODEL = os.getenv('AI_MODEL')
QA_API_URL = os.getenv('QA_API_URL')
QA_MODEL = os.getenv('QA_MODEL')
POD_API_KEY = os.getenv('POD_API_KEY')  # bearer token used by both APIs
# Create database connection (PostgreSQL via SQLAlchemy)
DATABASE_URL = f"postgresql://{DB_USER}:{DB_PASSWORD}@{DB_HOST}:{DB_PORT}/{DB_NAME}"
engine = create_engine(DATABASE_URL)
Session = sessionmaker(bind=engine)
def get_embedding(text, context=None):
    """Fetch an embedding vector for *text* from the AI embedding API.

    Args:
        text: The text to embed.
        context: Optional context string; when given, the request embeds
            "context: text" so related chunks land closer together.

    Returns:
        The embedding (list of floats from the API response), or None on
        any request or response-shape failure.
    """
    try:
        input_text = f"{context}: {text}" if context else text
        response = requests.post(
            EMBEDDING_API_URL,
            headers={"Content-Type": "application/json", "Authorization": f"Bearer {POD_API_KEY}"},
            json={
                "model": EMBEDDING_MODEL,
                "input": input_text
            },
            timeout=60,  # bound the wait -- requests has no default timeout
        )
        response.raise_for_status()
        return response.json()['data'][0]['embedding']
    except (requests.RequestException, KeyError, IndexError, ValueError) as e:
        # Network/HTTP errors, a malformed JSON body, or an unexpected payload
        # shape; callers treat None as "embedding unavailable".
        console.print(f"[red]Error getting embedding: {e}[/red]")
        return None
def cosine_similarity(a, b):
    """Calculate cosine similarity between two vectors.

    Args:
        a: Array-like numeric vector.
        b: Array-like numeric vector of the same length.

    Returns:
        float in [-1, 1]; 0.0 when either vector has zero magnitude
        (the unguarded formula would divide by zero and yield NaN).
    """
    norm_product = np.linalg.norm(a) * np.linalg.norm(b)
    if norm_product == 0:
        return 0.0
    return np.dot(a, b) / norm_product
def search_similar_content(query, limit=5):
    """Rank stored PDF chunks by cosine similarity to *query*.

    Embeds the query, loads every stored embedding, and scores them in
    Python. NOTE(review): this is O(rows) per query and loads all
    embeddings into memory -- fine for small corpora, but a vector index
    (e.g. pgvector) would be needed at scale.

    Args:
        query: Natural-language search string.
        limit: Maximum number of results to return (default 5).

    Returns:
        Up to *limit* dicts with 'similarity', 'content', 'file_name',
        'page_number' and 'metadata' keys, best match first; [] on failure.
    """
    # Create the session BEFORE the try block: if Session() itself raised
    # inside try, the finally clause would hit a NameError on session.close().
    session = Session()
    try:
        query_embedding = get_embedding(query)
        if not query_embedding:
            return []
        # Hoist the query-vector conversion out of the scoring loop.
        query_vec = np.array(query_embedding)
        results = session.query(PDFEmbedding, PDFFile).join(PDFFile).all()
        similarities = []
        for result in results:
            embedding = result.PDFEmbedding.embedding
            if not embedding:
                continue  # rows without a stored embedding cannot be scored
            similarity = cosine_similarity(query_vec, np.array(embedding))
            similarities.append({
                'similarity': similarity,
                'content': result.PDFEmbedding.page_content,
                'file_name': result.PDFFile.filename,
                'page_number': result.PDFEmbedding.page_number,
                'metadata': {
                    'file_name': result.PDFFile.filename,
                    'page': result.PDFEmbedding.page_number,
                    'type': result.PDFEmbedding.content_type.value if result.PDFEmbedding.content_type else 'unknown',
                    'level': result.PDFEmbedding.hierarchy_level.value if result.PDFEmbedding.hierarchy_level else 'unknown'
                }
            })
        # Best match first, then trim to the requested count.
        similarities.sort(key=lambda x: x['similarity'], reverse=True)
        return similarities[:limit]
    except Exception as e:
        # Deliberately broad: search is best-effort and callers expect []
        # on any failure rather than a crash.
        console.print(f"[red]Error searching: {e}[/red]")
        return []
    finally:
        session.close()
def get_llm_response(query, context_docs):
    """Ask the chat-completion API to answer *query* using retrieved context.

    Args:
        query: The user's question.
        context_docs: Result dicts from search_similar_content(); each must
            provide 'file_name', 'page_number' and 'content' keys.

    Returns:
        The assistant's reply text, or an "Error: ..." string on failure
        (callers display the return value either way).
    """
    try:
        # Concatenate the retrieved chunks with their provenance so the model
        # can cite document name and page number in its answer.
        context = "\n\n".join([
            f"Document: {doc['file_name']} (Page {doc['page_number']})\n{doc['content']}"
            for doc in context_docs
        ])
        # Prepare messages for the LLM
        messages = [
            {
                "role": "system",
                "content": (
                    "You are a friendly and helpful customer service representative named Alex. Respond to customer queries about our product "
                    "in a conversational, professional manner. Follow these guidelines:\n\n"
                    "1. Start responses with a warm greeting and acknowledge the customer's question\n"
                    "2. Use a friendly, professional tone throughout your response\n"
                    "3. Structure your responses like this:\n"
                    "   - Greeting and acknowledgment\n"
                    "   - Clear, direct answer\n"
                    "   - Supporting details from our documentation\n"
                    "   - Helpful suggestions or related information\n"
                    "   - Offer for additional assistance\n\n"
                    "4. When providing product information:\n"
                    "   - Use simple, clear language\n"
                    "   - Break down complex technical details into understandable terms\n"
                    "   - Support your answers with documentation, cited as:\n"
                    "     > [relevant information]\n"
                    "     (From: [document name], Page [number])\n\n"
                    "5. For technical or troubleshooting questions:\n"
                    "   - Provide easy-to-follow, step-by-step instructions\n"
                    "   - Explain what each step accomplishes\n"
                    "   - Offer alternative solutions when available\n\n"
                    "6. When discussing limitations or issues:\n"
                    "   - Be honest but positive\n"
                    "   - Focus on what can be done\n"
                    "   - Provide workarounds when possible\n\n"
                    "7. Always end your response by:\n"
                    "   - Asking if they need any clarification\n"
                    "   - Inviting them to ask more questions\n"
                    "   - Thanking them for choosing our product\n\n"
                    "Remember to maintain a helpful, positive tone while being accurate and honest about product information."
                )
            },
            {
                "role": "user",
                "content": f"Context:\n{context}\n\nQuestion: {query}\n\nPlease answer the question based on the context provided, maintaining a friendly customer service tone."
            }
        ]
        # Call the LLM API (commented-out alternate "Prop Firm Specialist"
        # prompt removed -- recover it from version control if needed).
        response = requests.post(
            QA_API_URL,
            headers={"Content-Type": "application/json", "Authorization": f"Bearer {POD_API_KEY}"},
            json={
                "model": QA_MODEL,
                "messages": messages,
                "temperature": 0.3,  # low temperature: favor grounded, consistent answers
                "max_tokens": 4000,
                "top_p": 0.8,
                "stream": False
            },
            timeout=120,  # generation is slow, but the wait must be bounded
        )
        response.raise_for_status()
        # Extract and return the response
        return response.json()['choices'][0]['message']['content']
    except Exception as e:
        # Deliberately broad: any failure (network, bad payload shape, missing
        # doc keys) degrades to an error string the UI can display.
        console.print(f"[red]Error getting LLM response: {e}[/red]")
        return f"Error: Could not generate response. {str(e)}"
def main():
    """Interactive loop: answer questions about indexed PDFs until the user quits."""
    console.print(Panel.fit("PDF Question Answering System", style="bold magenta"))
    while True:
        try:
            # Prompt for the next question.
            console.print("\n[cyan]Enter your question (or 'quit' to exit):[/cyan]")
            question = input().strip()
            if question.lower() in ['quit', 'exit', 'q']:
                break

            # Retrieve the most relevant stored chunks for this question.
            console.print("\n[cyan]Searching for relevant content...[/cyan]")
            matches = search_similar_content(question)
            if not matches:
                console.print("[yellow]No relevant content found.[/yellow]")
                continue

            # Generate and render the answer.
            console.print("\n[cyan]Generating answer...[/cyan]")
            answer = get_llm_response(question, matches)
            console.print("\n[bold]Answer:[/bold]")
            console.print(Markdown(answer))

            # Show which documents/pages the answer was drawn from.
            console.print("\n[bold]Sources:[/bold]")
            for match in matches:
                console.print(f"- {match['file_name']} (Page {match['page_number']}) [Similarity: {match['similarity']:.2f}]")
        except KeyboardInterrupt:
            # Ctrl-C exits the loop cleanly.
            break
        except Exception as e:
            # Report and keep the session alive for the next question.
            console.print(f"[red]Error: {e}[/red]")
            continue
    console.print("\n[cyan]Thank you for using the PDF QA System![/cyan]")
if __name__ == "__main__":
    main()