1717from collections .abc import Callable
1818from typing import TYPE_CHECKING
1919
20- from sec_certs .configuration import config
21- from sec_certs .converter import PDFConverter
2220from sec_certs .dataset .auxiliary_dataset_handling import (
2321 CCSchemeDatasetHandler ,
2422 CPEDatasetHandler ,
5957from sec_certs .utils .profiling import staged
6058
6159if TYPE_CHECKING :
60+ from sec_certs .configuration import config
61+ from sec_certs .converter import PDFConverter
6262 from sec_certs .dataset .cc import CCDataset
6363 from sec_certs .dataset .eucc import EUCCDataset
6464
@@ -82,7 +82,7 @@ def download_pdfs(
8282
8383 if not fresh :
8484 logger .info (
85- f"Downloading { len (certs_to_process )} PDFs of { obj .dataset_name } { doc_type .long } s for which previous download failed."
85+ f"Downloading { len (certs_to_process )} PDFs of { obj .name } { doc_type .long } s for which previous download failed."
8686 )
8787
8888 download_pdf_funcs = {
@@ -94,7 +94,7 @@ def download_pdfs(
9494 cert_processing .process_parallel (
9595 download_pdf_funcs [doc_type ],
9696 certs_to_process ,
97- progress_bar_desc = f"Downloading PDFs of { obj .dataset_name } { doc_type .long } s" ,
97+ progress_bar_desc = f"Downloading PDFs of { obj .name } { doc_type .long } s" ,
9898 )
9999
100100
@@ -136,7 +136,7 @@ def convert_pdfs(
136136
137137 if not fresh :
138138 logger .info (
139- f"Converting { len (certs_to_process )} PDFs of { obj .dataset_name } { doc_type .long } s for which previous conversion failed."
139+ f"Converting { len (certs_to_process )} PDFs of { obj .name } { doc_type .long } s for which previous conversion failed."
140140 )
141141
142142 convert_pdf_funcs = {
@@ -152,7 +152,7 @@ def convert_pdfs(
152152 certs_to_process ,
153153 config .pdf_conversion_workers ,
154154 config .pdf_conversion_max_chunk_size ,
155- progress_bar_desc = f"Converting PDFs of { obj .dataset_name } { doc_type .long } s" ,
155+ progress_bar_desc = f"Converting PDFs of { obj .name } { doc_type .long } s" ,
156156 )
157157
158158 obj .update_with_certs (processed_certs )
@@ -189,7 +189,7 @@ def extract_generic(obj: CCDataset | EUCCDataset, doc_type: DocType, worker_func
189189 worker_func ,
190190 certs_to_process ,
191191 use_threading = False ,
192- progress_bar_desc = f"Extracting { obj .dataset_name } { doc_type .long } { worker_func .__name__ .split ('_' )[- 1 ]} " ,
192+ progress_bar_desc = f"Extracting { obj .name } { doc_type .long } { worker_func .__name__ .split ('_' )[- 1 ]} " ,
193193 )
194194 obj .update_with_certs (processed )
195195
0 commit comments