88import pathlib
99import uuid
1010import warnings
11- from collections .abc import Container , Iterator , Sequence
11+ from collections .abc import Container , Iterator , Mapping , Sequence
1212from threading import RLock
13- from typing import Any , Callable , Literal , Optional , Tuple , Union , Mapping
13+ from typing import Any , Callable , Literal , Optional , Tuple , Union
1414
1515import fsspec
1616import geopandas as gpd
5252from ..error import DataStoreError
5353from ..search import DefaultSearchMixin
5454from ..store import MutableDataStore
55- from .accessor import STORAGE_OPTIONS_PARAM_NAME , FsAccessor , FsDataAccessor
55+ from .accessor import STORAGE_OPTIONS_PARAM_NAME , FsAccessor
5656
5757_DEFAULT_DATA_TYPE = DATASET_TYPE .alias
5858_DEFAULT_FORMAT_ID = "zarr"
@@ -277,7 +277,7 @@ def get_data_opener_ids(
277277 predicate = get_data_accessor_predicate (
278278 data_type = acc_data_type_alias ,
279279 format_id = format_id ,
280- storage_id = storage_id
280+ storage_id = storage_id ,
281281 )
282282 )
283283 )
@@ -287,8 +287,7 @@ def get_data_opener_ids(
287287 ext .name
288288 for ext in find_data_opener_extensions (
289289 predicate = get_data_accessor_predicate (
290- data_type = data_type ,
291- storage_id = storage_id
290+ data_type = data_type , storage_id = storage_id
292291 )
293292 )
294293 )
@@ -419,47 +418,48 @@ def _get_delete_data_params_schema(writer: DataWriter, data_id: str):
419418
420419 def _get_filename_ext_to_format_openers (self ):
421420 if not self ._filename_ext_to_format_openers :
422- (self . _filename_ext_to_format_openers ,
423- self . _format_to_data_type_aliases_openers ) = (
424- self ._set_infos_from_extensions (
425- find_data_opener_extensions , self .protocol
426- )
421+ (
422+ self . _filename_ext_to_format_openers ,
423+ self ._format_to_data_type_aliases_openers ,
424+ ) = self ._set_infos_from_extensions (
425+ find_data_opener_extensions , self . protocol
427426 )
428427 return self ._filename_ext_to_format_openers
429428
430429 def _get_format_to_data_type_aliases_openers (self ):
431430 if not self ._format_to_data_type_aliases_openers :
432- (self . _filename_ext_to_format_openers ,
433- self . _format_to_data_type_aliases_openers ) = (
434- self ._set_infos_from_extensions (
435- find_data_opener_extensions , self .protocol
436- )
431+ (
432+ self . _filename_ext_to_format_openers ,
433+ self ._format_to_data_type_aliases_openers ,
434+ ) = self ._set_infos_from_extensions (
435+ find_data_opener_extensions , self . protocol
437436 )
438437 return self ._format_to_data_type_aliases_openers
439438
440439 def _get_filename_ext_to_format_writers (self ):
441440 if not self ._filename_ext_to_format_writers :
442- (self . _filename_ext_to_format_writers ,
443- self . _format_to_data_type_aliases_writers ) = (
444- self ._set_infos_from_extensions (
445- find_data_writer_extensions , self .protocol
446- )
441+ (
442+ self . _filename_ext_to_format_writers ,
443+ self ._format_to_data_type_aliases_writers ,
444+ ) = self ._set_infos_from_extensions (
445+ find_data_writer_extensions , self . protocol
447446 )
448447 return self ._filename_ext_to_format_writers
449448
450449 def _get_format_to_data_type_aliases_writers (self ):
451450 if not self ._format_to_data_type_aliases_writers :
452- (self . _filename_ext_to_format_writers ,
453- self . _format_to_data_type_aliases_writers ) = (
454- self ._set_infos_from_extensions (
455- find_data_writer_extensions , self .protocol
456- )
451+ (
452+ self . _filename_ext_to_format_writers ,
453+ self ._format_to_data_type_aliases_writers ,
454+ ) = self ._set_infos_from_extensions (
455+ find_data_writer_extensions , self . protocol
457456 )
458457 return self ._format_to_data_type_aliases_writers
459458
460459 @classmethod
461- def _set_infos_from_extensions (cls , find_extensions , protocol = None ) -> (
462- Tuple )[dict , dict ]:
460+ def _set_infos_from_extensions (
461+ cls , find_extensions , protocol = None
462+ ) -> (Tuple )[dict , dict ]:
463463 filename_ext_to_format = {}
464464 format_to_data_type_aliases = {}
465465 predicate = get_data_accessor_predicate (storage_id = protocol )
@@ -471,12 +471,12 @@ def _set_infos_from_extensions(cls, find_extensions, protocol=None) -> (
471471 filename_ext_to_format [extension ] = fmt
472472 if data_type == "mldataset" :
473473 format_to_data_type_aliases [fmt ] = (
474- ( data_type , ) + format_to_data_type_aliases . get ( fmt , ())
475- )
474+ data_type ,
475+ ) + format_to_data_type_aliases . get ( fmt , ())
476476 else :
477- format_to_data_type_aliases [fmt ] = (
478- format_to_data_type_aliases . get ( fmt , ()) + ( data_type , )
479- )
477+ format_to_data_type_aliases [fmt ] = format_to_data_type_aliases . get (
478+ fmt , ()
479+ ) + ( data_type ,)
480480 return filename_ext_to_format , format_to_data_type_aliases
481481
482482 def _get_data_types (self ):
@@ -519,10 +519,7 @@ def _guess_writer_id(self, data, data_id: str = None):
519519 return extensions [0 ].name
520520
521521 def _find_opener (
522- self ,
523- opener_id : str = None ,
524- data_id : str = None ,
525- data_type : DataTypeLike = None
522+ self , opener_id : str = None , data_id : str = None , data_type : DataTypeLike = None
526523 ) -> DataOpener :
527524 if not opener_id :
528525 opener_id = self ._find_opener_id (
@@ -540,7 +537,9 @@ def _is_data_type_available(self, data_id: str, data_type: DataTypeLike) -> bool
540537 format_id = self ._get_filename_ext_to_format_openers ().get (ext .lower ())
541538 if format_id is None :
542539 return False
543- avail_data_types = self ._get_format_to_data_type_aliases_openers ().get (format_id )
540+ avail_data_types = self ._get_format_to_data_type_aliases_openers ().get (
541+ format_id
542+ )
544543 data_type = DataType .normalize (data_type )
545544 return any (
546545 data_type .is_super_type_of (avail_data_type )
@@ -601,8 +600,10 @@ def _find_opener_id(
601600
602601 def _find_writer_id (self , data_id : str = None , require = True ) -> Optional [str ]:
603602 return self ._find_accessor_id (
604- find_data_writer_extensions , self ._guess_best_writer_id_parts ,
605- data_id = data_id , require = require
603+ find_data_writer_extensions ,
604+ self ._guess_best_writer_id_parts ,
605+ data_id = data_id ,
606+ require = require ,
606607 )
607608
608609 def _find_accessor_id (
@@ -677,7 +678,9 @@ def _guess_all_opener_id_parts(
677678 return self ._guess_all_accessor_id_parts (
678679 self ._get_filename_ext_to_format_openers (),
679680 self ._get_format_to_data_type_aliases_openers (),
680- data_id , data_type , require
681+ data_id ,
682+ data_type ,
683+ require ,
681684 )
682685
683686 def _guess_best_opener_id_parts (
@@ -686,7 +689,9 @@ def _guess_best_opener_id_parts(
686689 return self ._guess_best_accessor_id_parts (
687690 self ._get_filename_ext_to_format_openers (),
688691 self ._get_format_to_data_type_aliases_openers (),
689- data_id , data_type , require
692+ data_id ,
693+ data_type ,
694+ require ,
690695 )
691696
692697 def _guess_best_writer_id_parts (
@@ -695,12 +700,18 @@ def _guess_best_writer_id_parts(
695700 return self ._guess_best_accessor_id_parts (
696701 self ._get_filename_ext_to_format_writers (),
697702 self ._get_format_to_data_type_aliases_writers (),
698- data_id , data_type , require
703+ data_id ,
704+ data_type ,
705+ require ,
699706 )
700707
701708 def _guess_all_accessor_id_parts (
702- self , filename_ext_to_format , format_to_data_type_alias ,
703- data_id : str , data_type : DataTypeLike = None , require = True
709+ self ,
710+ filename_ext_to_format ,
711+ format_to_data_type_alias ,
712+ data_id : str ,
713+ data_type : DataTypeLike = None ,
714+ require = True ,
704715 ) -> list [tuple [str , str , str ]]:
705716 assert_given (data_id , "data_id" )
706717 ext = self ._get_filename_ext (data_id )
@@ -720,12 +731,19 @@ def _guess_all_accessor_id_parts(
720731 return [(dta , format_id , self .protocol ) for dta in data_type_aliases ]
721732
722733 def _guess_best_accessor_id_parts (
723- self , filename_ext_to_format , format_to_data_type_alias ,
724- data_id : str , data_type : DataTypeLike = None , require = True
734+ self ,
735+ filename_ext_to_format ,
736+ format_to_data_type_alias ,
737+ data_id : str ,
738+ data_type : DataTypeLike = None ,
739+ require = True ,
725740 ) -> tuple [str , str , str ]:
726741 accessor_id_parts = self ._guess_all_accessor_id_parts (
727- filename_ext_to_format , format_to_data_type_alias , data_id , data_type ,
728- require
742+ filename_ext_to_format ,
743+ format_to_data_type_alias ,
744+ data_id ,
745+ data_type ,
746+ require ,
729747 )
730748 return accessor_id_parts [0 ] if len (accessor_id_parts ) > 0 else accessor_id_parts
731749
@@ -908,9 +926,7 @@ def get_filename_extensions(
908926 )
909927 filename_extensions = {}
910928 filename_ext_to_format , format_to_data_type_aliases = (
911- cls ._set_infos_from_extensions (
912- find_extensions , cls .get_protocol ()
913- )
929+ cls ._set_infos_from_extensions (find_extensions , cls .get_protocol ())
914930 )
915931 for filename_ext , fmt in filename_ext_to_format .items ():
916932 data_type_aliases = format_to_data_type_aliases .get (fmt , [])
0 commit comments