@@ -227,8 +227,7 @@ def _parse_edges_from_llm_data(
227227 target_ref = target_ref ,
228228 evidence = evidence ,
229229 utterance_ids = utterance_ids ,
230- earliest_timestamp = earliest_timestamp_str
231- or window .earliest_timestamp ,
230+ earliest_timestamp = earliest_timestamp_str or window .earliest_timestamp ,
232231 earliest_seconds = earliest_seconds or window .earliest_seconds ,
233232 confidence = float (edge_data .get ("confidence" , 0.5 )),
234233 )
@@ -295,9 +294,7 @@ def canonicalize_and_store(
295294 ) -> dict [str , Any ]:
296295 """Canonicalize nodes and edges and store them in Postgres."""
297296
298- def _normalize_speaker_ref (
299- ref : str , window_speaker_ids : list [str ]
300- ) -> str | None :
297+ def _normalize_speaker_ref (ref : str , window_speaker_ids : list [str ]) -> str | None :
301298 ref = (ref or "" ).strip ()
302299 if not ref :
303300 return None
@@ -353,9 +350,7 @@ def _normalize_speaker_ref(
353350 speaker_nodes_data = []
354351 for speaker_id in speaker_ids_seen :
355352 meta = speaker_meta .get (speaker_id , {})
356- label = (
357- meta .get ("full_name" ) or meta .get ("normalized_name" ) or speaker_id
358- )
353+ label = meta .get ("full_name" ) or meta .get ("normalized_name" ) or speaker_id
359354 aliases = []
360355 for candidate in (
361356 meta .get ("full_name" ),
@@ -435,13 +430,11 @@ def _normalize_speaker_ref(
435430 target_id = temp_to_canonical .get (target_ref , target_ref )
436431
437432 if not (
438- edge .source_ref .startswith ("speaker_" )
439- or edge .source_ref in temp_to_canonical
433+ edge .source_ref .startswith ("speaker_" ) or edge .source_ref in temp_to_canonical
440434 ):
441435 stats ["links_to_known" ] += 1
442436 if not (
443- edge .target_ref .startswith ("speaker_" )
444- or edge .target_ref in temp_to_canonical
437+ edge .target_ref .startswith ("speaker_" ) or edge .target_ref in temp_to_canonical
445438 ):
446439 stats ["links_to_known" ] += 1
447440
@@ -554,13 +547,9 @@ def _embed_new_nodes(self, node_ids: list[str]) -> None:
554547
555548 ids = [x [0 ] for x in to_embed ]
556549 texts = [x [1 ] for x in to_embed ]
557- embeddings = self .embedding .generate_embeddings_batch (
558- texts , task_type = "RETRIEVAL_DOCUMENT"
559- )
550+ embeddings = self .embedding .generate_embeddings_batch (texts , task_type = "RETRIEVAL_DOCUMENT" )
560551
561- update_rows = [
562- (vector_literal (vec ), node_id ) for node_id , vec in zip (ids , embeddings )
563- ]
552+ update_rows = [(vector_literal (vec ), node_id ) for node_id , vec in zip (ids , embeddings )]
564553 self .postgres .execute_batch (
565554 """
566555 UPDATE kg_nodes
0 commit comments