Skip to content

Commit af0c7c7

Browse files
authored
python312Packages.docling: 2.23.0 -> 2.25.1 (#386660)
2 parents 7768e6b + 4c5af10 commit af0c7c7

File tree

2 files changed

+45
-26
lines changed

2 files changed

+45
-26
lines changed

pkgs/development/python-modules/docling-ibm-models/default.nix

Lines changed: 29 additions & 21 deletions
Original file line numberDiff line numberDiff line change
@@ -2,53 +2,62 @@
22
lib,
33
buildPythonPackage,
44
fetchFromGitHub,
5+
6+
# build-system
57
poetry-core,
8+
69
# dependencies
7-
torch,
8-
torchvision,
9-
transformers,
10+
docling-core,
1011
huggingface-hub,
1112
jsonlines,
1213
numpy,
1314
opencv-python-headless,
1415
pillow,
15-
tqdm,
16+
pydantic,
1617
safetensors,
18+
torch,
19+
torchvision,
20+
tqdm,
21+
transformers,
22+
23+
# tests
24+
datasets,
1725
pytestCheckHook,
26+
writableTmpDirAsHomeHook,
1827
}:
1928

2029
buildPythonPackage rec {
2130
pname = "docling-ibm-models";
22-
version = "3.3.2";
31+
version = "3.4.1";
2332
pyproject = true;
2433

2534
src = fetchFromGitHub {
2635
owner = "DS4SD";
2736
repo = "docling-ibm-models";
2837
tag = "v${version}";
29-
hash = "sha256-8mqDgbTj5g6jXEumj16Me9NjHLCOdR+pXmAwn2dghfg=";
38+
hash = "sha256-IgKP+4en0N6xLBjzwmddDk8z5P3J1vo+UMW+65a01Ww=";
3039
};
3140

3241
build-system = [
3342
poetry-core
3443
];
3544

3645
dependencies = [
37-
torch
38-
torchvision
39-
transformers
40-
numpy
46+
docling-core
47+
huggingface-hub
4148
jsonlines
42-
pillow
43-
tqdm
49+
numpy
4450
opencv-python-headless
45-
huggingface-hub
51+
pillow
52+
pydantic
4653
safetensors
54+
torch
55+
torchvision
56+
tqdm
57+
transformers
4758
];
4859

4960
pythonRelaxDeps = [
50-
"pillow"
51-
"torchvision"
5261
"transformers"
5362
"numpy"
5463
];
@@ -58,19 +67,18 @@ buildPythonPackage rec {
5867
];
5968

6069
nativeCheckInputs = [
70+
datasets
6171
pytestCheckHook
72+
writableTmpDirAsHomeHook
6273
];
6374

64-
preCheck = ''
65-
export HOME="$TEMPDIR"
66-
'';
67-
6875
disabledTests = [
6976
# Requires network access
70-
"test_layoutpredictor"
71-
"test_tf_predictor"
7277
"test_code_formula_predictor" # huggingface_hub.errors.LocalEntryNotFoundError
7378
"test_figure_classifier" # huggingface_hub.errors.LocalEntryNotFoundError
79+
"test_layoutpredictor"
80+
"test_readingorder"
81+
"test_tf_predictor"
7482
];
7583

7684
meta = {

pkgs/development/python-modules/docling/default.nix

Lines changed: 16 additions & 5 deletions
Original file line numberDiff line numberDiff line change
@@ -9,7 +9,6 @@
99
# dependencies
1010
beautifulsoup4,
1111
certifi,
12-
deepsearch-glm,
1312
docling-core,
1413
docling-ibm-models,
1514
docling-parse,
@@ -49,14 +48,14 @@
4948

5049
buildPythonPackage rec {
5150
pname = "docling";
52-
version = "2.23.0";
51+
version = "2.25.1";
5352
pyproject = true;
5453

5554
src = fetchFromGitHub {
5655
owner = "DS4SD";
5756
repo = "docling";
5857
tag = "v${version}";
59-
hash = "sha256-ySywKaLxjtgQM7RtzJrxZDS3z8uMwAwPDYO51uKHT28=";
58+
hash = "sha256-uJZIwXVwGd9xDBQkZ/uz2XLJ+lL1ZAZHJv/jHtW/LCk=";
6059
};
6160

6261
build-system = [
@@ -66,7 +65,6 @@ buildPythonPackage rec {
6665
dependencies = [
6766
beautifulsoup4
6867
certifi
69-
deepsearch-glm
7068
docling-core
7169
docling-ibm-models
7270
docling-parse
@@ -133,6 +131,19 @@ buildPythonPackage rec {
133131
"test_e2e_pdfs_conversions" # AssertionError: ## TableFormer: Table Structure Understanding with Transf
134132
"test_e2e_conversions" # RuntimeError: Tesseract is not available
135133

134+
# AssertionError
135+
# assert doc.export_to_markdown() == pair[1], f"Error in case {idx}"
136+
"test_ordered_lists"
137+
138+
# AssertionError: export to md
139+
"test_e2e_html_conversions"
140+
141+
# AssertionError: assert 'Unordered li...d code block:' == 'Unordered li...d code block:'
142+
"test_convert_valid"
143+
144+
# AssertionError: Markdown file mismatch against groundtruth pftaps057006474.md
145+
"test_patent_groundtruth"
146+
136147
# huggingface_hub.errors.LocalEntryNotFoundError: An error happened
137148
"test_cli_convert"
138149
"test_code_and_formula_conversion"
@@ -152,7 +163,7 @@ buildPythonPackage rec {
152163
meta = {
153164
description = "Get your documents ready for gen AI";
154165
homepage = "https://github.com/DS4SD/docling";
155-
changelog = "https://github.com/DS4SD/docling/blob/${src.rev}/CHANGELOG.md";
166+
changelog = "https://github.com/DS4SD/docling/blob/v${version}/CHANGELOG.md";
156167
license = lib.licenses.mit;
157168
maintainers = with lib.maintainers; [ happysalada ];
158169
mainProgram = "docling";

0 commit comments

Comments
 (0)