Skip to content

Commit f91ce3a

Browse files
authored
build: 0.0.77 release; bump to unstructured==0.15.5 (#450)
### Summary

Bumps to `unstructured==0.15.5`. Also pulls in the latest version of the `wolfi` base image.
1 parent 7468938 commit f91ce3a

File tree

7 files changed

+57
-61
lines changed

7 files changed

+57
-61
lines changed

CHANGELOG.md

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,7 @@
1+
## 0.0.77
2+
3+
* Bump to `unstructured` 0.15.5
4+
15
## 0.0.76
26
* Use the library's `detect_filetype` in API to determine mimetype
37
* Add content_type api parameter

Dockerfile

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
11
# syntax=docker/dockerfile:experimental
2-
FROM quay.io/unstructured-io/base-images:wolfi-base-e48da6b@sha256:8ad3479e5dc87a86e4794350cca6385c01c6d110902c5b292d1a62e231be711b as base
2+
FROM quay.io/unstructured-io/base-images:wolfi-base-latest as base
33

44
# NOTE(crag): NB_USER ARG for mybinder.org compat:
55
# https://mybinder.readthedocs.io/en/latest/tutorials/dockerfile.html

prepline_general/api/app.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -13,7 +13,7 @@
1313
app = FastAPI(
1414
title="Unstructured Pipeline API",
1515
summary="Partition documents with the Unstructured library",
16-
version="0.0.76",
16+
version="0.0.77",
1717
docs_url="/general/docs",
1818
openapi_url="/general/openapi.json",
1919
servers=[

prepline_general/api/general.py

Lines changed: 3 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -619,7 +619,7 @@ async def stream_response(self, send: Send) -> None:
619619
)
620620
async for chunk in self.body_iterator:
621621
if not isinstance(chunk, bytes):
622-
chunk = chunk.encode(self.charset)
622+
chunk = chunk.encode(self.charset) # type: ignore
623623
chunk = b64encode(chunk)
624624
await send(
625625
{"type": "http.response.body", "body": self.build_part(chunk), "more_body": True}
@@ -649,7 +649,7 @@ def return_content_type(filename: str):
649649

650650

651651
@router.get("/general/v0/general", include_in_schema=False)
652-
@router.get("/general/v0.0.76/general", include_in_schema=False)
652+
@router.get("/general/v0.0.77/general", include_in_schema=False)
653653
async def handle_invalid_get_request():
654654
raise HTTPException(
655655
status_code=status.HTTP_405_METHOD_NOT_ALLOWED, detail="Only POST requests are supported."
@@ -664,7 +664,7 @@ async def handle_invalid_get_request():
664664
description="Description",
665665
operation_id="partition_parameters",
666666
)
667-
@router.post("/general/v0.0.76/general", include_in_schema=False)
667+
@router.post("/general/v0.0.77/general", include_in_schema=False)
668668
def general_partition(
669669
request: Request,
670670
# cannot use annotated type here because of a bug described here:

preprocessing-pipeline-family.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,2 +1,2 @@
11
name: general
2-
version: 0.0.76
2+
version: 0.0.77

requirements/base.txt

Lines changed: 20 additions & 23 deletions
Original file line numberDiff line numberDiff line change
@@ -26,7 +26,7 @@ certifi==2024.7.4
2626
# httpx
2727
# requests
2828
# unstructured-client
29-
cffi==1.16.0
29+
cffi==1.17.0
3030
# via cryptography
3131
chardet==5.2.0
3232
# via unstructured
@@ -65,7 +65,7 @@ et-xmlfile==1.1.0
6565
# via openpyxl
6666
exceptiongroup==1.2.2
6767
# via anyio
68-
fastapi==0.112.0
68+
fastapi==0.112.1
6969
# via -r requirements/base.in
7070
filelock==3.15.4
7171
# via
@@ -84,7 +84,7 @@ fsspec==2024.6.1
8484
# torch
8585
google-api-core[grpc]==2.19.1
8686
# via google-cloud-vision
87-
google-auth==2.32.0
87+
google-auth==2.33.0
8888
# via
8989
# google-api-core
9090
# google-cloud-vision
@@ -136,7 +136,7 @@ langdetect==1.0.9
136136
# via unstructured
137137
layoutparser==0.3.4
138138
# via unstructured-inference
139-
lxml==5.2.2
139+
lxml==5.3.0
140140
# via
141141
# pikepdf
142142
# python-docx
@@ -150,7 +150,7 @@ marshmallow==3.21.3
150150
# via
151151
# dataclasses-json
152152
# unstructured-client
153-
matplotlib==3.9.0
153+
matplotlib==3.9.2
154154
# via
155155
# pycocotools
156156
# unstructured-inference
@@ -191,7 +191,7 @@ onnx==1.16.2
191191
# via
192192
# unstructured
193193
# unstructured-inference
194-
onnxruntime==1.18.1
194+
onnxruntime==1.19.0
195195
# via unstructured-inference
196196
opencv-python==4.10.0.84
197197
# via
@@ -208,7 +208,6 @@ packaging==24.1
208208
# matplotlib
209209
# onnxruntime
210210
# pikepdf
211-
# pytesseract
212211
# transformers
213212
# unstructured-client
214213
# unstructured-pytesseract
@@ -224,9 +223,9 @@ pdfminer-six==20231228
224223
# via
225224
# pdfplumber
226225
# unstructured
227-
pdfplumber==0.11.2
226+
pdfplumber==0.11.3
228227
# via layoutparser
229-
pikepdf==9.1.0
228+
pikepdf==9.1.1
230229
# via unstructured
231230
pillow==10.4.0
232231
# via
@@ -236,7 +235,6 @@ pillow==10.4.0
236235
# pdfplumber
237236
# pikepdf
238237
# pillow-heif
239-
# pytesseract
240238
# python-pptx
241239
# torchvision
242240
# unstructured-pytesseract
@@ -288,8 +286,6 @@ pypdf==4.3.1
288286
# unstructured-client
289287
pypdfium2==4.30.0
290288
# via pdfplumber
291-
pytesseract==0.3.10
292-
# via unstructured
293289
python-dateutil==2.9.0.post0
294290
# via
295291
# matplotlib
@@ -305,18 +301,18 @@ python-multipart==0.0.9
305301
# via unstructured-inference
306302
python-oxmsg==0.0.1
307303
# via unstructured
308-
python-pptx==0.6.23
304+
python-pptx==1.0.2
309305
# via unstructured
310306
pytz==2024.1
311307
# via pandas
312-
pyyaml==6.0.1
308+
pyyaml==6.0.2
313309
# via
314310
# huggingface-hub
315311
# layoutparser
316312
# omegaconf
317313
# timm
318314
# transformers
319-
rapidfuzz==3.9.5
315+
rapidfuzz==3.9.6
320316
# via
321317
# unstructured
322318
# unstructured-inference
@@ -354,11 +350,11 @@ sniffio==1.3.1
354350
# via
355351
# anyio
356352
# httpx
357-
soupsieve==2.5
353+
soupsieve==2.6
358354
# via beautifulsoup4
359-
starlette==0.37.2
355+
starlette==0.38.2
360356
# via fastapi
361-
sympy==1.13.1
357+
sympy==1.13.2
362358
# via
363359
# onnxruntime
364360
# torch
@@ -387,7 +383,7 @@ tqdm==4.66.5
387383
# nltk
388384
# transformers
389385
# unstructured
390-
transformers==4.43.4
386+
transformers==4.44.0
391387
# via unstructured-inference
392388
typing-extensions==4.12.2
393389
# via
@@ -401,6 +397,7 @@ typing-extensions==4.12.2
401397
# pypdf
402398
# python-docx
403399
# python-oxmsg
400+
# python-pptx
404401
# torch
405402
# typing-inspect
406403
# unstructured
@@ -412,19 +409,19 @@ typing-inspect==0.9.0
412409
# unstructured-client
413410
tzdata==2024.1
414411
# via pandas
415-
unstructured[all-docs]==0.15.1
412+
unstructured[all-docs]==0.15.5
416413
# via -r requirements/base.in
417-
unstructured-client==0.25.2
414+
unstructured-client==0.25.5
418415
# via unstructured
419416
unstructured-inference==0.7.36
420417
# via unstructured
421-
unstructured-pytesseract==0.3.12
418+
unstructured-pytesseract==0.3.13
422419
# via unstructured
423420
urllib3==2.2.2
424421
# via
425422
# requests
426423
# unstructured-client
427-
uvicorn==0.30.5
424+
uvicorn==0.30.6
428425
# via -r requirements/base.in
429426
wrapt==1.16.0
430427
# via

0 commit comments

Comments
 (0)