File tree Expand file tree Collapse file tree 18 files changed +158
-103
lines changed
expected-structured-output-html/local-single-file-with-pdf-infer-table-structure
expected-structured-output/local-single-file-with-pdf-infer-table-structure
test_unstructured/cleaners Expand file tree Collapse file tree 18 files changed +158
-103
lines changed Original file line number Diff line number Diff line change 1+ ## 0.17.7
2+
3+ ### Enhancements
4+ - ** Updated Docker file with ENV HF_HUB_OFFLINE=1 to prevent the contianer from trying to access the internet
5+
6+ ### Features
7+
8+ ### Fixes
9+
110## 0.17.7-dev0
211
312### Enhancements
Original file line number Diff line number Diff line change @@ -31,4 +31,6 @@ RUN find requirements/ -type f -name "*.txt" ! -name "test.txt" ! -name "dev.txt
3131 $PYTHON -c "from unstructured.partition.model_init import initialize; initialize()" && \
3232 $PYTHON -c "from unstructured_inference.models.tables import UnstructuredTableTransformerModel; model = UnstructuredTableTransformerModel(); model.initialize('microsoft/table-transformer-structure-recognition')"
3333
34+ ENV HF_HUB_OFFLINE=1
35+
3436CMD ["/bin/bash" ]
Original file line number Diff line number Diff line change @@ -20,25 +20,25 @@ cffi==1.17.1
2020 # via cryptography
2121chardet==5.2.0
2222 # via -r ./base.in
23- charset-normalizer==3.4.1
23+ charset-normalizer==3.4.2
2424 # via
2525 # requests
2626 # unstructured-client
2727click==8.1.8
2828 # via
2929 # nltk
3030 # python-oxmsg
31- cryptography==44 .0.2
31+ cryptography==45 .0.3
3232 # via unstructured-client
3333dataclasses-json==0.6.7
3434 # via
3535 # -r ./base.in
3636 # unstructured-client
37- deepdiff==8.4.2
37+ deepdiff==8.5.0
3838 # via unstructured-client
3939emoji==2.14.1
4040 # via -r ./base.in
41- exceptiongroup==1.2.2
41+ exceptiongroup==1.3.0
4242 # via anyio
4343filetype==1.2.0
4444 # via -r ./base.in
@@ -56,7 +56,7 @@ idna==3.10
5656 # httpx
5757 # requests
5858 # unstructured-client
59- joblib==1.4.2
59+ joblib==1.5.1
6060 # via nltk
6161jsonpath-python==1.0.6
6262 # via unstructured-client
@@ -80,7 +80,7 @@ numpy==2.0.2
8080 # via -r ./base.in
8181olefile==0.47
8282 # via python-oxmsg
83- orderly-set==5.4.0
83+ orderly-set==5.4.1
8484 # via deepdiff
8585packaging==25.0
8686 # via
@@ -90,7 +90,7 @@ psutil==7.0.0
9090 # via -r ./base.in
9191pycparser==2.22
9292 # via cffi
93- pypdf==5.4 .0
93+ pypdf==5.6 .0
9494 # via unstructured-client
9595python-dateutil==2.9.0.post0
9696 # via unstructured-client
@@ -125,11 +125,12 @@ tqdm==4.67.1
125125 # via
126126 # -r ./base.in
127127 # nltk
128- typing-extensions==4.13.2
128+ typing-extensions==4.14.0
129129 # via
130130 # -r ./base.in
131131 # anyio
132132 # beautifulsoup4
133+ # exceptiongroup
133134 # pypdf
134135 # python-oxmsg
135136 # typing-inspect
Original file line number Diff line number Diff line change @@ -17,9 +17,9 @@ distlib==0.3.9
1717 # via virtualenv
1818filelock==3.18.0
1919 # via virtualenv
20- identify==2.6.10
20+ identify==2.6.12
2121 # via pre-commit
22- importlib-metadata==8.6.1
22+ importlib-metadata==8.7.0
2323 # via
2424 # -c ././deps/constraints.txt
2525 # build
@@ -32,7 +32,7 @@ packaging==25.0
3232 # build
3333pip-tools==7.4.1
3434 # via -r ./dev.in
35- platformdirs==4.3.7
35+ platformdirs==4.3.8
3636 # via
3737 # -c ./test.txt
3838 # virtualenv
@@ -49,11 +49,11 @@ tomli==2.2.1
4949 # -c ./test.txt
5050 # build
5151 # pip-tools
52- virtualenv==20.30.0
52+ virtualenv==20.31.2
5353 # via pre-commit
5454wheel==0.45.1
5555 # via pip-tools
56- zipp==3.21 .0
56+ zipp==3.22 .0
5757 # via importlib-metadata
5858
5959# The following packages are considered to be unsafe in a requirements file:
Original file line number Diff line number Diff line change @@ -10,7 +10,7 @@ lxml==5.4.0
1010 # python-docx
1111python-docx==1.1.2
1212 # via -r ./extra-docx.in
13- typing-extensions==4.13.2
13+ typing-extensions==4.14.0
1414 # via
1515 # -c ./base.txt
1616 # python-docx
Original file line number Diff line number Diff line change 44#
55# pip-compile ./extra-markdown.in
66#
7- importlib-metadata==8.6.1
7+ importlib-metadata==8.7.0
88 # via
99 # -c ././deps/constraints.txt
1010 # markdown
1111markdown==3.8
1212 # via -r ./extra-markdown.in
13- zipp==3.21 .0
13+ zipp==3.22 .0
1414 # via importlib-metadata
Original file line number Diff line number Diff line change @@ -12,7 +12,7 @@ pypandoc==1.15
1212 # via -r ./extra-odt.in
1313python-docx==1.1.2
1414 # via -r ./extra-odt.in
15- typing-extensions==4.13.2
15+ typing-extensions==4.14.0
1616 # via
1717 # -c ./base.txt
1818 # python-docx
Original file line number Diff line number Diff line change 44#
55# pip-compile ./extra-paddleocr.in
66#
7- albucore==0.0.23
7+ albucore==0.0.24
88 # via
99 # albumentations
1010 # unstructured-paddleocr
11- albumentations==2.0.5
11+ albumentations==2.0.8
1212 # via unstructured-paddleocr
1313annotated-types==0.7.0
1414 # via pydantic
@@ -28,23 +28,23 @@ certifi==2025.4.26
2828 # httpcore
2929 # httpx
3030 # requests
31- charset-normalizer==3.4.1
31+ charset-normalizer==3.4.2
3232 # via
3333 # -c ./base.txt
3434 # requests
35- cython==3.0.12
35+ cython==3.1.1
3636 # via unstructured-paddleocr
3737decorator==5.2.1
3838 # via paddlepaddle
3939eval-type-backport==0.2.2
4040 # via albumentations
41- exceptiongroup==1.2.2
41+ exceptiongroup==1.3.0
4242 # via
4343 # -c ./base.txt
4444 # anyio
4545fire==0.7.0
4646 # via unstructured-paddleocr
47- fonttools==4.57.0
47+ fonttools==4.58.1
4848 # via unstructured-paddleocr
4949h11==0.16.0
5050 # via
@@ -115,15 +115,15 @@ pillow==11.2.1
115115 # paddlepaddle
116116 # scikit-image
117117 # unstructured-paddleocr
118- protobuf==6.30.2
118+ protobuf==6.31.1
119119 # via
120120 # -c ././deps/constraints.txt
121121 # paddlepaddle
122122pyclipper==1.3.0.post6
123123 # via unstructured-paddleocr
124- pydantic==2.11.3
124+ pydantic==2.11.5
125125 # via albumentations
126- pydantic-core==2.33.1
126+ pydantic-core==2.33.2
127127 # via pydantic
128128python-docx==1.1.2
129129 # via unstructured-paddleocr
@@ -147,7 +147,7 @@ scipy==1.13.1
147147 # scikit-image
148148shapely==2.0.7
149149 # via unstructured-paddleocr
150- simsimd==6.2.1
150+ simsimd==6.4.7
151151 # via albucore
152152sniffio==1.3.1
153153 # via
@@ -159,27 +159,28 @@ soupsieve==2.7
159159 # beautifulsoup4
160160stringzilla==3.12.5
161161 # via albucore
162- termcolor==3.0.1
162+ termcolor==3.1.0
163163 # via fire
164164tifffile==2024.8.30
165165 # via scikit-image
166166tqdm==4.67.1
167167 # via
168168 # -c ./base.txt
169169 # unstructured-paddleocr
170- typing-extensions==4.13.2
170+ typing-extensions==4.14.0
171171 # via
172172 # -c ./base.txt
173173 # albucore
174174 # albumentations
175175 # anyio
176176 # beautifulsoup4
177+ # exceptiongroup
177178 # paddlepaddle
178179 # pydantic
179180 # pydantic-core
180181 # python-docx
181182 # typing-inspection
182- typing-inspection==0.4.0
183+ typing-inspection==0.4.1
183184 # via pydantic
184185unstructured-paddleocr==2.10.0
185186 # via -r ./extra-paddleocr.in
You can’t perform that action at this time.
0 commit comments