1616from azure .identity import DefaultAzureCredential
1717from datashaper import Progress
1818
19- from graphrag .logging .base import ProgressReporter
19+ from graphrag .logger .base import ProgressLogger
2020from graphrag .storage .pipeline_storage import PipelineStorage
2121
2222log = logging .getLogger (__name__ )
@@ -97,7 +97,7 @@ def find(
9797 self ,
9898 file_pattern : re .Pattern [str ],
9999 base_dir : str | None = None ,
100- progress : ProgressReporter | None = None ,
100+ progress : ProgressLogger | None = None ,
101101 file_filter : dict [str , Any ] | None = None ,
102102 max_count = - 1 ,
103103 ) -> Iterator [tuple [str , dict [str , Any ]]]:
@@ -186,18 +186,18 @@ async def get(
186186 items_list = list (queried_items )
187187 for item in items_list :
188188 item ["id" ] = item ["id" ].split (":" )[1 ]
189-
189+
190190 items_json_str = json .dumps (items_list )
191191
192192 items_df = pd .read_json (
193193 StringIO (items_json_str ), orient = "records" , lines = False
194194 )
195195 return items_df .to_parquet ()
196-
196+
197197 item = container_client .read_item (item = key , partition_key = key )
198198 item_body = item .get ("body" )
199199 return json .dumps (item_body )
200-
200+
201201 except Exception :
202202 log .exception ("Error reading item %s" , key )
203203 return None
@@ -224,7 +224,7 @@ async def set(self, key: str, value: Any, encoding: str | None = None) -> None:
224224 cosmosdb_item_list = json .loads (value_json )
225225 for cosmosdb_item in cosmosdb_item_list :
226226 # Append an additional prefix to the id to force a unique identifier for the create_final_nodes rows
227- if ( prefix == "create_final_nodes" ) :
227+ if prefix == "create_final_nodes" :
228228 prefixed_id = f"{ prefix } -community_{ cosmosdb_item ['community' ]} :{ cosmosdb_item ['id' ]} "
229229 else :
230230 prefixed_id = f"{ prefix } :{ cosmosdb_item ['id' ]} "
@@ -250,7 +250,7 @@ async def has(self, key: str) -> bool:
250250 prefix = self ._get_prefix (key )
251251 query = f"SELECT * FROM c WHERE STARTSWITH(c.id, '{ prefix } ')" # noqa: S608
252252 queried_items = container_client .query_items (
253- query = query , enable_cross_partition_query = True
253+ query = query , enable_cross_partition_query = True
254254 )
255255 return len (list (queried_items )) > 0
256256 return False
@@ -264,7 +264,7 @@ async def delete(self, key: str) -> None:
264264 prefix = self ._get_prefix (key )
265265 query = f"SELECT * FROM c WHERE STARTSWITH(c.id, '{ prefix } ')" # noqa: S608
266266 queried_items = container_client .query_items (
267- query = query , enable_cross_partition_query = True
267+ query = query , enable_cross_partition_query = True
268268 )
269269 for item in queried_items :
270270 container_client .delete_item (item = item ["id" ], partition_key = item ["id" ])
@@ -290,7 +290,7 @@ def keys(self) -> list[str]:
290290 def child (self , name : str | None ) -> PipelineStorage :
291291 """Create a child storage instance."""
292292 return self
293-
293+
294294 def _get_prefix (self , key : str ) -> str :
295295 """Get the prefix of the filename key."""
296296 return key .split ("." )[0 ]
0 commit comments