@@ -62,7 +62,7 @@ def create_source_node_graph_local_file(uri, userName, password, file, model, db
6262 logging .error (f"Error in creating document node: { error_message } " )
6363 return create_api_response (job_status , message = message ,error = error_message ,file_source = obj_source_node .source ,file_name = obj_source_node .file_name )
6464
65- def create_source_node_graph_url (uri , userName , password ,model , source_url = None , db_name = None ,wiki_query :List [ str ] = None ,aws_access_key_id = None ,aws_secret_access_key = None , gcs_bucket_name = None , gcs_bucket_folder = None ):
65+ def create_source_node_graph_url (uri , userName , password ,model , source_url = None , db_name = None , wiki_query :str = None , aws_access_key_id = None ,aws_secret_access_key = None , gcs_bucket_name = None , gcs_bucket_folder = None ):
6666 """
6767 Creates a source node in Neo4jGraph and sets properties.
6868
@@ -157,16 +157,19 @@ def create_source_node_graph_url(uri, userName, password ,model, source_url=None
157157 source_type = 'text'
158158 job_status = 'Completed'
159159 pages = WikipediaLoader (query = query .strip (), load_max_docs = 1 , load_all_available_meta = True ).load ()
160- obj_source_node = sourceNode ()
161- obj_source_node .file_name = query .strip ()
162- obj_source_node .file_type = source_type
163- obj_source_node .file_source = 'Wikipedia'
164- obj_source_node .file_size = sys .getsizeof (pages [0 ].page_content )
165- obj_source_node .model = model
166- obj_source_node .url = pages [0 ].metadata ['source' ]
167- obj_source_node .created_at = datetime .now ()
168- obj_source_node .status = 'New'
169160 try :
161+ if not pages :
162+ Failed_count += 1
163+ continue
164+ obj_source_node = sourceNode ()
165+ obj_source_node .file_name = query .strip ()
166+ obj_source_node .file_type = source_type
167+ obj_source_node .file_source = 'Wikipedia'
168+ obj_source_node .file_size = sys .getsizeof (pages [0 ].page_content )
169+ obj_source_node .model = model
170+ obj_source_node .url = pages [0 ].metadata ['source' ]
171+ obj_source_node .created_at = datetime .now ()
172+ obj_source_node .status = 'New'
170173 graphDb_data_Access = graphDBdataAccess (graph )
171174 graphDb_data_Access .create_source_node (obj_source_node )
172175 success_count += 1
@@ -273,9 +276,17 @@ def extract_graph_from_file(uri, userName, password, model, db_name=None, file=N
273276 logging .error (f"Pdf content or Youtube transcript is not available" )
274277 graphDb_data_Access .update_exception_db (file_name ,message )
275278 return create_api_response (job_status ,message = message ,file_name = file_name )
276-
277- # update_node_prop = "SET d.createdAt ='{}', d.updatedAt = '{}', d.processingTime = '{}',d.status = '{}', d.errorMessage = '{}',d.nodeCount= {}, d.relationshipCount = {}, d.model = '{}'"
278- # pages = loader.load_and_split()
279+
280+ obj_source_node = sourceNode ()
281+ status = "Processing"
282+ obj_source_node .file_name = file_name
283+ obj_source_node .status = status
284+ obj_source_node .created_at = start_time
285+ obj_source_node .updated_at = start_time
286+ logging .info (file_name )
287+ logging .info (obj_source_node )
288+ # graphDb_data_Access.update_source_node(obj_source_node)
289+
279290 full_document_content = ""
280291 bad_chars = ['"' , "\n " , "'" ]
281292 for i in range (0 ,len (pages )):
@@ -336,7 +347,6 @@ def extract_graph_from_file(uri, userName, password, model, db_name=None, file=N
336347 obj_source_node .node_count = nodes_created
337348 obj_source_node .relationship_count = relationships_created
338349
339- graphDb_data_Access = graphDBdataAccess (graph )
340350 graphDb_data_Access .update_source_node (obj_source_node )
341351
342352 output = {
0 commit comments