@@ -89,7 +89,9 @@ def _file_exists(filename):
8989
9090 # read alternative values either as csv or feather file
9191 alt_values_fea_file = alt_values_file .replace (".csv" , ".fea" )
92- if os .path .exists (os .path .join (edb_directory , alt_values_fea_file .format (name = name ))):
92+ if os .path .exists (
93+ os .path .join (edb_directory , alt_values_fea_file .format (name = name ))
94+ ):
9395 alt_values = _read_feather (alt_values_fea_file )
9496 else :
9597 alt_values = _read_csv (alt_values_file )
@@ -183,12 +185,14 @@ def _file_exists(filename):
183185
184186 def split (a , n ):
185187 k , m = divmod (len (a ), n )
186- return (a [i * k + min (i , m ): (i + 1 ) * k + min (i + 1 , m )] for i in range (n ))
188+ return (a [i * k + min (i , m ) : (i + 1 ) * k + min (i + 1 , m )] for i in range (n ))
187189
188190 # process x_ca with cv_to_ca with or without chunking
189191 x_ca_pickle_file = "{name}_x_ca.pkl"
190192 if chunking_size == None :
191- x_ca = cv_to_ca (alt_values .set_index ([chooser_index_name , alt_values .columns [1 ]]))
193+ x_ca = cv_to_ca (
194+ alt_values .set_index ([chooser_index_name , alt_values .columns [1 ]])
195+ )
192196 elif _file_exists (x_ca_pickle_file ):
193197 # if pickle file from previous x_ca processing exist, load it to save time
194198 time_start = datetime .now ()
@@ -207,7 +211,8 @@ def split(a, n):
207211 for chunk_ids in split_ids :
208212 alt_values_i = alt_values [alt_values ["person_id" ].isin (chunk_ids )]
209213 x_ca_i = cv_to_ca (
210- alt_values_i .set_index ([chooser_index_name , alt_values_i .columns [1 ]]))
214+ alt_values_i .set_index ([chooser_index_name , alt_values_i .columns [1 ]])
215+ )
211216 x_ca_list .append (x_ca_i )
212217 print (
213218 f"\r x_ca_i compute done for chunk { i } /{ num_chunks } - time elapsed { (datetime .now () - time_start ).total_seconds ()} "
@@ -217,7 +222,8 @@ def split(a, n):
217222 # save final x_ca result as pickle file to save time for future data loading
218223 _to_pickle (df = x_ca , filename = x_ca_pickle_file )
219224 print (
220- f"x_ca compute done - time elapsed { (datetime .now () - time_start ).total_seconds ()} " )
225+ f"x_ca compute done - time elapsed { (datetime .now () - time_start ).total_seconds ()} "
226+ )
221227
222228 if CHOOSER_SEGMENT_COLUMN_NAME is not None :
223229 # label segments with names
0 commit comments