File tree Expand file tree Collapse file tree 2 files changed +45
-26
lines changed
pkgs/development/python-modules Expand file tree Collapse file tree 2 files changed +45
-26
lines changed Original file line number Diff line number Diff line change 22 lib ,
33 buildPythonPackage ,
44 fetchFromGitHub ,
5+
6+ # build-system
57 poetry-core ,
8+
69 # dependencies
7- torch ,
8- torchvision ,
9- transformers ,
10+ docling-core ,
1011 huggingface-hub ,
1112 jsonlines ,
1213 numpy ,
1314 opencv-python-headless ,
1415 pillow ,
15- tqdm ,
16+ pydantic ,
1617 safetensors ,
18+ torch ,
19+ torchvision ,
20+ tqdm ,
21+ transformers ,
22+
23+ # tests
24+ datasets ,
1725 pytestCheckHook ,
26+ writableTmpDirAsHomeHook ,
1827} :
1928
2029buildPythonPackage rec {
2130 pname = "docling-ibm-models" ;
22- version = "3.3.2 " ;
31+ version = "3.4.1 " ;
2332 pyproject = true ;
2433
2534 src = fetchFromGitHub {
2635 owner = "DS4SD" ;
2736 repo = "docling-ibm-models" ;
2837 tag = "v${ version } " ;
29- hash = "sha256-8mqDgbTj5g6jXEumj16Me9NjHLCOdR+pXmAwn2dghfg =" ;
38+ hash = "sha256-IgKP+4en0N6xLBjzwmddDk8z5P3J1vo+UMW+65a01Ww =" ;
3039 } ;
3140
3241 build-system = [
3342 poetry-core
3443 ] ;
3544
3645 dependencies = [
37- torch
38- torchvision
39- transformers
40- numpy
46+ docling-core
47+ huggingface-hub
4148 jsonlines
42- pillow
43- tqdm
49+ numpy
4450 opencv-python-headless
45- huggingface-hub
51+ pillow
52+ pydantic
4653 safetensors
54+ torch
55+ torchvision
56+ tqdm
57+ transformers
4758 ] ;
4859
4960 pythonRelaxDeps = [
50- "pillow"
51- "torchvision"
5261 "transformers"
5362 "numpy"
5463 ] ;
@@ -58,19 +67,18 @@ buildPythonPackage rec {
5867 ] ;
5968
6069 nativeCheckInputs = [
70+ datasets
6171 pytestCheckHook
72+ writableTmpDirAsHomeHook
6273 ] ;
6374
64- preCheck = ''
65- export HOME="$TEMPDIR"
66- '' ;
67-
6875 disabledTests = [
6976 # Requires network access
70- "test_layoutpredictor"
71- "test_tf_predictor"
7277 "test_code_formula_predictor" # huggingface_hub.errors.LocalEntryNotFoundError
7378 "test_figure_classifier" # huggingface_hub.errors.LocalEntryNotFoundError
79+ "test_layoutpredictor"
80+ "test_readingorder"
81+ "test_tf_predictor"
7482 ] ;
7583
7684 meta = {
Original file line number Diff line number Diff line change 99 # dependencies
1010 beautifulsoup4 ,
1111 certifi ,
12- deepsearch-glm ,
1312 docling-core ,
1413 docling-ibm-models ,
1514 docling-parse ,
4948
5049buildPythonPackage rec {
5150 pname = "docling" ;
52- version = "2.23.0 " ;
51+ version = "2.25.1 " ;
5352 pyproject = true ;
5453
5554 src = fetchFromGitHub {
5655 owner = "DS4SD" ;
5756 repo = "docling" ;
5857 tag = "v${ version } " ;
59- hash = "sha256-ySywKaLxjtgQM7RtzJrxZDS3z8uMwAwPDYO51uKHT28 =" ;
58+ hash = "sha256-uJZIwXVwGd9xDBQkZ/uz2XLJ+lL1ZAZHJv/jHtW/LCk =" ;
6059 } ;
6160
6261 build-system = [
@@ -66,7 +65,6 @@ buildPythonPackage rec {
6665 dependencies = [
6766 beautifulsoup4
6867 certifi
69- deepsearch-glm
7068 docling-core
7169 docling-ibm-models
7270 docling-parse
@@ -133,6 +131,19 @@ buildPythonPackage rec {
133131 "test_e2e_pdfs_conversions" # AssertionError: ## TableFormer: Table Structure Understanding with Transf
134132 "test_e2e_conversions" # RuntimeError: Tesseract is not available
135133
134+ # AssertionError
135+ # assert doc.export_to_markdown() == pair[1], f"Error in case {idx}"
136+ "test_ordered_lists"
137+
138+ # AssertionError: export to md
139+ "test_e2e_html_conversions"
140+
141+ # AssertionError: assert 'Unordered li...d code block:' == 'Unordered li...d code block:'
142+ "test_convert_valid"
143+
144+ # AssertionError: Markdown file mismatch against groundtruth pftaps057006474.md
145+ "test_patent_groundtruth"
146+
136147 # huggingface_hub.errors.LocalEntryNotFoundError: An error happened
137148 "test_cli_convert"
138149 "test_code_and_formula_conversion"
@@ -152,7 +163,7 @@ buildPythonPackage rec {
152163 meta = {
153164 description = "Get your documents ready for gen AI" ;
154165 homepage = "https://github.com/DS4SD/docling" ;
155- changelog = "https://github.com/DS4SD/docling/blob/${ src . rev } /CHANGELOG.md" ;
166+ changelog = "https://github.com/DS4SD/docling/blob/v ${ version } /CHANGELOG.md" ;
156167 license = lib . licenses . mit ;
157168 maintainers = with lib . maintainers ; [ happysalada ] ;
158169 mainProgram = "docling" ;
You can’t perform that action at this time.
0 commit comments