Skip to content

Commit 6fdd748

Browse files
cau-git and dolfim-ibm authored
feat!: Upgrade to v2.0.0 (#48)
* feat!: Upgrade to v2.0.0
  Signed-off-by: Christoph Auer <[email protected]>
* Dummy change
  Signed-off-by: Christoph Auer <[email protected]>
* rename old parser as pdf_parser_v1
  Signed-off-by: Michele Dolfi <[email protected]>
---------
Signed-off-by: Christoph Auer <[email protected]>
Signed-off-by: Christoph Auer <[email protected]>
Signed-off-by: Michele Dolfi <[email protected]>
Co-authored-by: Michele Dolfi <[email protected]>
1 parent 48451ad commit 6fdd748

File tree

7 files changed

+17
-17
lines changed

7 files changed

+17
-17
lines changed

.github/scripts/build_rhel.sh

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -42,7 +42,7 @@ docker build --progress=plain \
4242
COPY ./dist/*.tar.gz /src/
4343
4444
RUN USE_SYSTEM_DEPS=\$USE_SYSTEM_DEPS pip3.11 install /src/docling_parse*.tar.gz \
45-
&& python3.11 -c 'from docling_parse.docling_parse import pdf_parser, pdf_parser_v2'
45+
&& python3.11 -c 'from docling_parse.docling_parse import pdf_parser_v1, pdf_parser_v2'
4646
4747
COPY ./tests /src/tests
4848

README.md

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -164,7 +164,7 @@ To build the package, simply run (make sure [poetry](https://python-poetry.org/)
164164
poetry build
165165
```
166166

167-
To test the package, run,
167+
To test the package, run:
168168

169169
```
170170
poetry run pytest ./tests -v -s

app/pybind_parse.cpp

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -13,7 +13,7 @@
1313
PYBIND11_MODULE(docling_parse, m) {
1414

1515
// purely for backward compatibility
16-
pybind11::class_<docling::docling_parser_v1>(m, "pdf_parser")
16+
pybind11::class_<docling::docling_parser_v1>(m, "pdf_parser_v1")
1717
.def(pybind11::init())
1818

1919
.def("set_loglevel", &docling::docling_parser_v1::set_loglevel)

docling_parse/eval.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,7 @@
55

66
from tabulate import tabulate
77

8-
from docling_parse.docling_parse import pdf_parser
8+
from docling_parse.docling_parse import pdf_parser_v1
99

1010

1111
def main():
@@ -52,7 +52,7 @@ def main():
5252

5353
# Print the path to the PDF file (or add your processing logic here)
5454

55-
parser = pdf_parser()
55+
parser = pdf_parser_v1()
5656
parser.set_loglevel(args.log_level)
5757

5858
overview = []

docling_parse/run.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -4,7 +4,7 @@
44
from tabulate import tabulate
55

66
import docling_parse
7-
from docling_parse.docling_parse import pdf_parser
7+
from docling_parse.docling_parse import pdf_parser_v1
88

99

1010
def main():
@@ -37,7 +37,7 @@ def main():
3737

3838
# Print the path to the PDF file (or add your processing logic here)
3939

40-
parser = pdf_parser()
40+
parser = pdf_parser_v1()
4141
parser.set_loglevel(args.log_level)
4242

4343
doc_file = args.pdf # filename

docling_parse/visualize.py

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -5,7 +5,7 @@
55

66
from tabulate import tabulate
77

8-
from docling_parse import pdf_parser, pdf_parser_v2
8+
from docling_parse import pdf_parser_v1, pdf_parser_v2
99

1010
try:
1111
from PIL import Image, ImageDraw
@@ -98,7 +98,7 @@ def visualise_v1(
9898
log_level: str, pdf_path: str, interactive: str, output_dir: str, page_num: int
9999
):
100100

101-
parser = pdf_parser()
101+
parser = pdf_parser_v1()
102102
parser.set_loglevel_with_label(log_level)
103103

104104
doc_key = "key"

tests/test_parse_v1.py

Lines changed: 8 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -38,7 +38,7 @@ def verify_reference_output(true_doc, pred_doc):
3838
"""
3939
def test_reference_documents_from_filenames():
4040
41-
parser = docling_parse.pdf_parser()
41+
parser = docling_parse.pdf_parser_v1()
4242
4343
pdf_docs = glob.glob("./tests/pdf_docs/tests/*.pdf")
4444
@@ -63,7 +63,7 @@ def test_reference_documents_from_filenames():
6363
"""
6464
def test_reference_documents_from_filenames_page_by_page():
6565
66-
parser = docling_parse.pdf_parser()
66+
parser = docling_parse.pdf_parser_v1()
6767
6868
pdf_docs = glob.glob("./tests/pdf_docs/tests/*.pdf")
6969
@@ -90,7 +90,7 @@ def test_reference_documents_from_filenames_page_by_page():
9090

9191
def test_reference_documents_from_filenames_with_keys():
9292

93-
parser = docling_parse.pdf_parser()
93+
parser = docling_parse.pdf_parser_v1()
9494
#parser.set_loglevel(4)
9595

9696
pdf_docs = glob.glob("./tests/pdf_docs/tests/*.pdf")
@@ -129,7 +129,7 @@ def test_reference_documents_from_filenames_with_keys():
129129

130130
def test_reference_documents_from_filenames_with_keys_page_by_page():
131131

132-
parser = docling_parse.pdf_parser()
132+
parser = docling_parse.pdf_parser_v1()
133133
#parser.set_loglevel(0)
134134

135135
pdf_docs = glob.glob("./tests/pdf_docs/tests/*.pdf")
@@ -176,7 +176,7 @@ def test_reference_documents_from_filenames_with_keys_page_by_page():
176176
"""
177177
def test_reference_documents_from_bytesio():
178178
179-
parser = docling_parse.pdf_parser()
179+
parser = docling_parse.pdf_parser_v1()
180180
181181
pdf_docs = glob.glob("./tests/pdf_docs/tests/*.pdf")
182182
@@ -209,7 +209,7 @@ def test_reference_documents_from_bytesio():
209209
"""
210210
def test_reference_documents_from_bytesio_page_by_page():
211211
212-
parser = docling_parse.pdf_parser()
212+
parser = docling_parse.pdf_parser_v1()
213213
#parser.set_loglevel(1)
214214
215215
pdf_docs = glob.glob("./tests/pdf_docs/tests/*.pdf")
@@ -244,7 +244,7 @@ def test_reference_documents_from_bytesio_page_by_page():
244244

245245
def test_reference_documents_from_bytesio_with_keys():
246246

247-
parser = docling_parse.pdf_parser()
247+
parser = docling_parse.pdf_parser_v1()
248248

249249
pdf_docs = glob.glob("./tests/pdf_docs/tests/*.pdf")
250250

@@ -284,7 +284,7 @@ def test_reference_documents_from_bytesio_with_keys():
284284
assert verify_reference_output(true_doc, pred_doc), "verify_reference_output(true_doc, pred_doc)"
285285
def test_reference_documents_from_bytesio_with_keys_page_by_page():
286286

287-
parser = docling_parse.pdf_parser()
287+
parser = docling_parse.pdf_parser_v1()
288288
#parser.set_loglevel(4)
289289

290290
pdf_docs = glob.glob("./tests/pdf_docs/tests/*.pdf")

0 commit comments

Comments
 (0)