Skip to content

Commit ab7bc82

Browse files
authored
Chore: Bump unstructured to 0.10.30 (#309)
^^^ Also releasing this version since `0.10.30` includes some 500 error bug fixes
1 parent 776d812 commit ab7bc82

File tree

8 files changed

+78
-49
lines changed

8 files changed

+78
-49
lines changed

CHANGELOG.md

Lines changed: 4 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,7 @@
1+
## 0.0.58
2+
3+
* Bump unstructured to 0.10.30
4+
15
## 0.0.57
26
* Make sure `multipage_sections` param defaults to `true` as per the readme
37
* Bump unstructured to 0.10.29

Dockerfile

Lines changed: 4 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -32,10 +32,12 @@ RUN python3.10 -m pip install pip==${PIP_VERSION} \
3232
USER ${NB_USER}
3333

3434
FROM python-deps as model-deps
35-
35+
# Note(yuming): quick workaround for ingest import error
36+
# should import `initialize` from within unstructured, but from outside the ingest dir
37+
COPY --chown=${NB_USER}:${NB_USER} scripts/hi_res_model_initialize.py hi_res_model_initialize.py
3638
RUN python3.10 -c "import nltk; nltk.download('punkt')" && \
3739
python3.10 -c "import nltk; nltk.download('averaged_perceptron_tagger')" && \
38-
python3.10 -c "from unstructured.ingest.pipeline.initialize import initialize; initialize()"
40+
python3.10 -c "from hi_res_model_initialize import initialize; initialize()"
3941

4042
FROM model-deps as code
4143
COPY --chown=${NB_USER}:${NB_USER} CHANGELOG.md CHANGELOG.md

prepline_general/api/app.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -11,7 +11,7 @@
1111
app = FastAPI(
1212
title="Unstructured Pipeline API",
1313
description="""""",
14-
version="0.0.57",
14+
version="0.0.58",
1515
docs_url="/general/docs",
1616
openapi_url="/general/openapi.json",
1717
)

prepline_general/api/general.py

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -636,7 +636,7 @@ def return_content_type(filename):
636636

637637

638638
@router.post("/general/v0/general")
639-
@router.post("/general/v0.0.57/general")
639+
@router.post("/general/v0.0.58/general")
640640
def pipeline_1(
641641
request: Request,
642642
gz_uncompressed_content_type: Optional[str] = Form(default=None),

preprocessing-pipeline-family.yaml

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,2 +1,2 @@
11
name: general
2-
version: 0.0.57
2+
version: 0.0.58

requirements/base.txt

Lines changed: 17 additions & 15 deletions
Original file line numberDiff line numberDiff line change
@@ -39,7 +39,7 @@ cryptography==41.0.5
3939
# via pdfminer-six
4040
cycler==0.12.1
4141
# via matplotlib
42-
dataclasses-json==0.6.1
42+
dataclasses-json==0.6.2
4343
# via unstructured
4444
effdet==0.4.1
4545
# via layoutparser
@@ -58,15 +58,15 @@ filetype==1.2.0
5858
# via unstructured
5959
flatbuffers==23.5.26
6060
# via onnxruntime
61-
fonttools==4.44.0
61+
fonttools==4.44.3
6262
# via matplotlib
6363
fsspec==2023.10.0
6464
# via
6565
# huggingface-hub
6666
# torch
6767
h11==0.14.0
6868
# via uvicorn
69-
huggingface-hub==0.17.3
69+
huggingface-hub==0.19.3
7070
# via
7171
# timm
7272
# tokenizers
@@ -115,7 +115,7 @@ networkx==3.2.1
115115
# unstructured
116116
nltk==3.8.1
117117
# via unstructured
118-
numpy==1.26.1
118+
numpy==1.26.2
119119
# via
120120
# contourpy
121121
# layoutparser
@@ -154,7 +154,7 @@ packaging==23.2
154154
# pytesseract
155155
# transformers
156156
# unstructured-pytesseract
157-
pandas==2.1.2
157+
pandas==2.1.3
158158
# via
159159
# layoutparser
160160
# unstructured
@@ -200,9 +200,9 @@ pypandoc==1.12
200200
# via unstructured
201201
pyparsing==3.1.1
202202
# via matplotlib
203-
pypdf==3.17.0
203+
pypdf==3.17.1
204204
# via -r requirements/base.in
205-
pypdfium2==4.23.1
205+
pypdfium2==4.24.0
206206
# via pdfplumber
207207
pytesseract==0.3.10
208208
# via layoutparser
@@ -218,7 +218,7 @@ python-magic==0.4.27
218218
# via unstructured
219219
python-multipart==0.0.6
220220
# via unstructured-inference
221-
python-pptx==0.6.21
221+
python-pptx==0.6.23
222222
# via unstructured
223223
pytz==2023.3.post1
224224
# via pandas
@@ -271,15 +271,15 @@ tabulate==0.9.0
271271
# via unstructured
272272
timm==0.9.10
273273
# via effdet
274-
tokenizers==0.14.1
274+
tokenizers==0.15.0
275275
# via transformers
276-
torch==2.1.0
276+
torch==2.1.1
277277
# via
278278
# effdet
279279
# layoutparser
280280
# timm
281281
# torchvision
282-
torchvision==0.16.0
282+
torchvision==0.16.1
283283
# via
284284
# effdet
285285
# layoutparser
@@ -290,7 +290,7 @@ tqdm==4.66.1
290290
# iopath
291291
# nltk
292292
# transformers
293-
transformers==4.35.0
293+
transformers==4.35.2
294294
# via unstructured-inference
295295
typing-extensions==4.8.0
296296
# via
@@ -307,13 +307,15 @@ typing-inspect==0.9.0
307307
# via dataclasses-json
308308
tzdata==2023.3
309309
# via pandas
310-
unstructured[local-inference]==0.10.29
311-
# via -r requirements/base.in
310+
unstructured[local-inference]==0.10.30
311+
# via
312+
# -r requirements/base.in
313+
# unstructured
312314
unstructured-inference==0.7.11
313315
# via unstructured
314316
unstructured-pytesseract==0.3.12
315317
# via unstructured
316-
urllib3==2.0.7
318+
urllib3==2.1.0
317319
# via requests
318320
uvicorn==0.24.0.post1
319321
# via -r requirements/base.in

0 commit comments

Comments
 (0)