66 @date:2023/10/20 14:01
77 @desc:
88"""
9- import logging
109import os
1110import threading
1211import datetime
2221from common .db .search import native_search , get_dynamics_model , native_update
2322from common .utils .common import get_file_content
2423from common .utils .lock import try_lock , un_lock
24+ from common .utils .logger import maxkb_logger , maxkb_error_logger
2525from common .utils .page_utils import page_desc
2626from knowledge .models import Paragraph , Status , Document , ProblemParagraphMapping , TaskType , State ,SourceType , SearchMode
2727from maxkb .conf import (PROJECT_DIR )
2828from django .utils .translation import gettext_lazy as _
2929
30- max_kb_error = logging .getLogger (__file__ )
31- max_kb = logging .getLogger (__file__ )
30+
3231lock = threading .Lock ()
3332
3433
@@ -87,12 +86,12 @@ def embedding_by_paragraph_list(paragraph_id_list, embedding_model: Embeddings):
8786 ListenerManagement .embedding_by_paragraph_data_list (data_list , paragraph_id_list = paragraph_id_list ,
8887 embedding_model = embedding_model )
8988 except Exception as e :
90- max_kb_error .error (_ ('Query vector data: {paragraph_id_list} error {error} {traceback}' ).format (
89+ maxkb_error_logger .error (_ ('Query vector data: {paragraph_id_list} error {error} {traceback}' ).format (
9190 paragraph_id_list = paragraph_id_list , error = str (e ), traceback = traceback .format_exc ()))
9291
9392 @staticmethod
9493 def embedding_by_paragraph_data_list (data_list , paragraph_id_list , embedding_model : Embeddings ):
95- max_kb .info (_ ('Start--->Embedding paragraph: {paragraph_id_list}' ).format (paragraph_id_list = paragraph_id_list ))
94+ maxkb_logger .info (_ ('Start--->Embedding paragraph: {paragraph_id_list}' ).format (paragraph_id_list = paragraph_id_list ))
9695 status = Status .success
9796 try :
9897 # 删除段落
@@ -104,12 +103,12 @@ def is_save_function():
104103 # 批量向量化
105104 VectorStore .get_embedding_vector ().batch_save (data_list , embedding_model , is_save_function )
106105 except Exception as e :
107- max_kb_error .error (_ ('Vectorized paragraph: {paragraph_id_list} error {error} {traceback}' ).format (
106+ maxkb_error_logger .error (_ ('Vectorized paragraph: {paragraph_id_list} error {error} {traceback}' ).format (
108107 paragraph_id_list = paragraph_id_list , error = str (e ), traceback = traceback .format_exc ()))
109108 status = Status .error
110109 finally :
111110 QuerySet (Paragraph ).filter (id__in = paragraph_id_list ).update (** {'status' : status })
112- max_kb .info (
111+ maxkb_logger .info (
113112 _ ('End--->Embedding paragraph: {paragraph_id_list}' ).format (paragraph_id_list = paragraph_id_list ))
114113
115114 @staticmethod
@@ -119,7 +118,7 @@ def embedding_by_paragraph(paragraph_id, embedding_model: Embeddings):
119118 @param paragraph_id: 段落id
120119 @param embedding_model: 向量模型
121120 """
122- max_kb .info (_ ('Start--->Embedding paragraph: {paragraph_id}' ).format (paragraph_id = paragraph_id ))
121+ maxkb_logger .info (_ ('Start--->Embedding paragraph: {paragraph_id}' ).format (paragraph_id = paragraph_id ))
123122 # 更新到开始状态
124123 ListenerManagement .update_status (QuerySet (Paragraph ).filter (id = paragraph_id ), TaskType .EMBEDDING , State .STARTED )
125124 try :
@@ -144,12 +143,12 @@ def is_the_task_interrupted():
144143 ListenerManagement .update_status (QuerySet (Paragraph ).filter (id = paragraph_id ), TaskType .EMBEDDING ,
145144 State .SUCCESS )
146145 except Exception as e :
147- max_kb_error .error (_ ('Vectorized paragraph: {paragraph_id} error {error} {traceback}' ).format (
146+ maxkb_error_logger .error (_ ('Vectorized paragraph: {paragraph_id} error {error} {traceback}' ).format (
148147 paragraph_id = paragraph_id , error = str (e ), traceback = traceback .format_exc ()))
149148 ListenerManagement .update_status (QuerySet (Paragraph ).filter (id = paragraph_id ), TaskType .EMBEDDING ,
150149 State .FAILURE )
151150 finally :
152- max_kb .info (_ ('End--->Embedding paragraph: {paragraph_id}' ).format (paragraph_id = paragraph_id ))
151+ maxkb_logger .info (_ ('End--->Embedding paragraph: {paragraph_id}' ).format (paragraph_id = paragraph_id ))
153152
154153 @staticmethod
155154 def embedding_by_data_list (data_list : List , embedding_model : Embeddings ):
@@ -265,7 +264,7 @@ def is_the_task_interrupted():
265264
266265 if is_the_task_interrupted ():
267266 return
268- max_kb .info (_ ('Start--->Embedding document: {document_id}' ).format (document_id = document_id )
267+ maxkb_logger .info (_ ('Start--->Embedding document: {document_id}' ).format (document_id = document_id )
269268 )
270269 # 批量修改状态为PADDING
271270 ListenerManagement .update_status (QuerySet (Document ).filter (id = document_id ), TaskType .EMBEDDING ,
@@ -285,12 +284,12 @@ def is_the_task_interrupted():
285284 document_id )),
286285 is_the_task_interrupted )
287286 except Exception as e :
288- max_kb_error .error (_ ('Vectorized document: {document_id} error {error} {traceback}' ).format (
287+ maxkb_error_logger .error (_ ('Vectorized document: {document_id} error {error} {traceback}' ).format (
289288 document_id = document_id , error = str (e ), traceback = traceback .format_exc ()))
290289 finally :
291290 ListenerManagement .post_update_document_status (document_id , TaskType .EMBEDDING )
292291 ListenerManagement .get_aggregation_document_status (document_id )()
293- max_kb .info (_ ('End--->Embedding document: {document_id}' ).format (document_id = document_id ))
292+ maxkb_logger .info (_ ('End--->Embedding document: {document_id}' ).format (document_id = document_id ))
294293 un_lock ('embedding' + str (document_id ))
295294
296295 @staticmethod
@@ -301,18 +300,18 @@ def embedding_by_knowledge(knowledge_id, embedding_model: Embeddings):
301300 @param embedding_model 向量模型
302301 :return: None
303302 """
304- max_kb .info (_ ('Start--->Embedding knowledge: {knowledge_id}' ).format (knowledge_id = knowledge_id ))
303+ maxkb_logger .info (_ ('Start--->Embedding knowledge: {knowledge_id}' ).format (knowledge_id = knowledge_id ))
305304 try :
306305 ListenerManagement .delete_embedding_by_knowledge (knowledge_id )
307306 document_list = QuerySet (Document ).filter (knowledge_id = knowledge_id )
308- max_kb .info (_ ('Start--->Embedding document: {document_list}' ).format (document_list = document_list ))
307+ maxkb_logger .info (_ ('Start--->Embedding document: {document_list}' ).format (document_list = document_list ))
309308 for document in document_list :
310309 ListenerManagement .embedding_by_document (document .id , embedding_model = embedding_model )
311310 except Exception as e :
312- max_kb_error .error (_ ('Vectorized knowledge: {knowledge_id} error {error} {traceback}' ).format (
311+ maxkb_error_logger .error (_ ('Vectorized knowledge: {knowledge_id} error {error} {traceback}' ).format (
313312 knowledge_id = knowledge_id , error = str (e ), traceback = traceback .format_exc ()))
314313 finally :
315- max_kb .info (_ ('End--->Embedding knowledge: {knowledge_id}' ).format (knowledge_id = knowledge_id ))
314+ maxkb_logger .info (_ ('End--->Embedding knowledge: {knowledge_id}' ).format (knowledge_id = knowledge_id ))
316315
317316 @staticmethod
318317 def delete_embedding_by_document (document_id ):
0 commit comments