Skip to content

Commit 381ad83

Browse files
[FIX] Delete Vector DB nodes after extraction (#100)
Delete nodes after extraction

Signed-off-by: Deepak <[email protected]>
1 parent 4d69936 commit 381ad83

File tree

2 files changed: 14 additions and 15 deletions

src/unstract/sdk/__init__.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,4 @@
1-
__version__ = "0.48.1"
1+
__version__ = "0.48.2"
22

33

44
def get_sdk_version():

src/unstract/sdk/index.py

Lines changed: 13 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -203,20 +203,7 @@ def index(
203203
level=LogLevel.ERROR,
204204
)
205205

206-
if doc_id_found and reindex:
207-
# Delete the nodes for the doc_id
208-
try:
209-
vector_db.delete(ref_doc_id=doc_id)
210-
self.tool.stream_log(f"Deleted nodes for {doc_id}")
211-
except Exception as e:
212-
self.tool.stream_log(
213-
f"Error deleting nodes for {doc_id}: {e}",
214-
level=LogLevel.ERROR,
215-
)
216-
raise SdkError(f"Error deleting nodes for {doc_id}: {e}") from e
217-
doc_id_found = False
218-
219-
if doc_id_found:
206+
if doc_id_found and not reindex:
220207
self.tool.stream_log(f"File was indexed already under {doc_id}")
221208
return doc_id
222209

@@ -287,6 +274,18 @@ def index(
287274
documents.append(document)
288275
self.tool.stream_log(f"Number of documents: {len(documents)}")
289276

277+
if doc_id_found:
278+
# Delete the nodes for the doc_id
279+
try:
280+
vector_db.delete(ref_doc_id=doc_id)
281+
self.tool.stream_log(f"Deleted nodes for {doc_id}")
282+
except Exception as e:
283+
self.tool.stream_log(
284+
f"Error deleting nodes for {doc_id}: {e}",
285+
level=LogLevel.ERROR,
286+
)
287+
raise SdkError(f"Error deleting nodes for {doc_id}: {e}") from e
288+
290289
try:
291290
if chunk_size == 0:
292291
parser = SentenceSplitter.from_defaults(

0 commit comments

Comments
 (0)