Skip to content

Commit efa152a

Browse files
factor out new cache-aware rebuild_embeddings
1 parent 5abb50d commit efa152a

File tree

1 file changed

+8
-5
lines changed

1 file changed

+8
-5
lines changed

app/rag_system.py

Lines changed: 8 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -25,13 +25,16 @@ def __init__(self, knowledge_base_path='./data/knowledge_base.json'):
2525
self.doc_embeddings = np.load('./data/doc_embeddings.npy')
2626
logging.info("Loaded existing document embeddings from disk.")
2727
else:
28-
logging.info("No existing document embeddings found, creating new embeddings.")
29-
self.doc_embeddings = self.embed_knowledge_base()
30-
# cache doc_embeddings to disk
31-
np.save('./data/doc_embeddings.npy', self.doc_embeddings.cpu().numpy())
28+
self.rebuild_embeddings()
3229
logging.info("Knowledge base embeddings created")
3330
self.conversation_history = []
3431

32+
def rebuild_embeddings(self):
    """Recompute the knowledge-base embeddings and cache them to disk.

    Calls ``self.embed_knowledge_base()``, stores the result on
    ``self.doc_embeddings`` and saves a NumPy copy of it to
    ``./data/doc_embeddings.npy``.

    Returns:
        The freshly computed embeddings (the same object that is stored on
        ``self.doc_embeddings``). Returning it keeps callers that assign the
        result, e.g. ``self.doc_embeddings = self.rebuild_embeddings()``,
        from overwriting the attribute with ``None``.
    """
    import os  # local import so this method does not rely on a file-level one

    logging.info("No existing document embeddings found, creating new embeddings.")
    self.doc_embeddings = self.embed_knowledge_base()
    # cache doc_embeddings to disk; make sure the target directory exists,
    # otherwise np.save raises FileNotFoundError
    os.makedirs('./data', exist_ok=True)
    np.save('./data/doc_embeddings.npy', self.doc_embeddings.cpu().numpy())
    return self.doc_embeddings
37+
3538
def load_knowledge_base(self):
    """Read and parse the JSON file at ``self.knowledge_base_path``.

    Returns:
        The parsed JSON content, exactly as produced by ``json.load``.
    """
    # Decode explicitly as UTF-8 so the result does not depend on the
    # platform's locale default encoding.
    with open(self.knowledge_base_path, 'r', encoding='utf-8') as kb_file:
        return json.load(kb_file)
@@ -183,7 +186,7 @@ def rebuild(self):
183186
"""
184187
print("Rebuilding embeddings for the knowledge base...")
185188
self.knowledge_base = self.load_knowledge_base() # Reload the knowledge base
186-
self.doc_embeddings = self.embed_knowledge_base() # Rebuild the embeddings
189+
self.doc_embeddings = self.rebuild_embeddings() # Rebuild the embeddings
187190
print("Embeddings have been rebuilt.")
188191

189192
def get_citations(self, retrieved_docs):

0 commit comments

Comments
 (0)