Skip to content

Commit c7eba16

Browse files
authored
build(deps): make pip-compile (#307)
* build: pip-compile, skip test deps * s
1 parent 5eaf449 commit c7eba16

File tree

11 files changed: 62 additions and 41 deletions.

CHANGELOG.md

Lines changed: 8 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -1,3 +1,11 @@
1+
## 0.4.17-dev0
2+
3+
### Enhancements
4+
5+
### Features
6+
7+
### Fixes
8+
19
## 0.4.16
210

311
### Enhancements

requirements/base.txt

Lines changed: 0 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -20,10 +20,6 @@ charset-normalizer==3.0.1
2020
# via requests
2121
click==8.1.3
2222
# via nltk
23-
colorama==0.4.6
24-
# via
25-
# click
26-
# tqdm
2723
deprecated==1.2.13
2824
# via argilla
2925
et-xmlfile==1.1.0

requirements/build.txt

Lines changed: 0 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -16,8 +16,6 @@ certifi==2022.12.7
1616
# requests
1717
charset-normalizer==3.0.1
1818
# via requests
19-
colorama==0.4.6
20-
# via sphinx
2119
docutils==0.18.1
2220
# via
2321
# sphinx

requirements/dev.txt

Lines changed: 11 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -6,6 +6,10 @@
66
#
77
anyio==3.6.2
88
# via jupyter-server
9+
appnope==0.1.3
10+
# via
11+
# ipykernel
12+
# ipython
913
argon2-cffi==21.3.0
1014
# via
1115
# jupyter-server
@@ -31,11 +35,6 @@ cffi==1.15.1
3135
# via argon2-cffi-bindings
3236
click==8.1.3
3337
# via pip-tools
34-
colorama==0.4.6
35-
# via
36-
# build
37-
# click
38-
# ipython
3938
comm==0.1.2
4039
# via ipykernel
4140
debugpy==1.6.6
@@ -108,7 +107,7 @@ jupyter-client==8.0.3
108107
# nbclient
109108
# notebook
110109
# qtconsole
111-
jupyter-console==6.6.1
110+
jupyter-console==6.6.2
112111
# via jupyter
113112
jupyter-core==5.2.0
114113
# via
@@ -182,6 +181,8 @@ pandocfilters==1.5.0
182181
# via nbconvert
183182
parso==0.8.3
184183
# via jedi
184+
pexpect==4.8.0
185+
# via ipython
185186
pickleshare==0.7.5
186187
# via ipython
187188
pip-tools==6.12.2
@@ -201,6 +202,10 @@ prompt-toolkit==3.0.37
201202
# jupyter-console
202203
psutil==5.9.4
203204
# via ipykernel
205+
ptyprocess==0.7.0
206+
# via
207+
# pexpect
208+
# terminado
204209
pure-eval==0.2.2
205210
# via stack-data
206211
pycparser==2.21

requirements/huggingface.txt

Lines changed: 0 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -22,10 +22,6 @@ click==8.1.3
2222
# via
2323
# nltk
2424
# sacremoses
25-
colorama==0.4.6
26-
# via
27-
# click
28-
# tqdm
2925
deprecated==1.2.13
3026
# via argilla
3127
et-xmlfile==1.1.0

requirements/ingest-github.txt

Lines changed: 15 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -8,7 +8,7 @@ anyio==3.6.2
88
# via
99
# -r requirements/base.txt
1010
# httpcore
11-
argilla==1.3.0
11+
argilla==1.3.1
1212
# via
1313
# -r requirements/base.txt
1414
# unstructured (setup.py)
@@ -33,10 +33,6 @@ click==8.1.3
3333
# via
3434
# -r requirements/base.txt
3535
# nltk
36-
colorama==0.4.6
37-
# via
38-
# click
39-
# tqdm
4036
deprecated==1.2.13
4137
# via
4238
# -r requirements/base.txt
@@ -64,6 +60,10 @@ idna==3.4
6460
# anyio
6561
# requests
6662
# rfc3986
63+
importlib-metadata==6.0.0
64+
# via
65+
# -r requirements/base.txt
66+
# markdown
6767
joblib==1.2.0
6868
# via
6969
# -r requirements/base.txt
@@ -74,6 +74,10 @@ lxml==4.9.2
7474
# python-docx
7575
# python-pptx
7676
# unstructured (setup.py)
77+
markdown==3.4.1
78+
# via
79+
# -r requirements/base.txt
80+
# unstructured (setup.py)
7781
monotonic==1.6
7882
# via
7983
# -r requirements/base.txt
@@ -107,7 +111,7 @@ pillow==9.4.0
107111
# unstructured (setup.py)
108112
pycparser==2.21
109113
# via cffi
110-
pydantic==1.10.4
114+
pydantic==1.10.5
111115
# via
112116
# -r requirements/base.txt
113117
# argilla
@@ -165,7 +169,7 @@ tqdm==4.64.1
165169
# -r requirements/base.txt
166170
# argilla
167171
# nltk
168-
typing-extensions==4.4.0
172+
typing-extensions==4.5.0
169173
# via
170174
# -r requirements/base.txt
171175
# pydantic
@@ -182,3 +186,7 @@ xlsxwriter==3.0.8
182186
# via
183187
# -r requirements/base.txt
184188
# python-pptx
189+
zipp==3.15.0
190+
# via
191+
# -r requirements/base.txt
192+
# importlib-metadata

requirements/ingest-reddit.txt

Lines changed: 12 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -57,6 +57,10 @@ idna==3.4
5757
# anyio
5858
# requests
5959
# rfc3986
60+
importlib-metadata==6.0.0
61+
# via
62+
# -r requirements/base.txt
63+
# markdown
6064
joblib==1.2.0
6165
# via
6266
# -r requirements/base.txt
@@ -67,6 +71,10 @@ lxml==4.9.2
6771
# python-docx
6872
# python-pptx
6973
# unstructured (setup.py)
74+
markdown==3.4.1
75+
# via
76+
# -r requirements/base.txt
77+
# unstructured (setup.py)
7078
monotonic==1.6
7179
# via
7280
# -r requirements/base.txt
@@ -176,3 +184,7 @@ xlsxwriter==3.0.8
176184
# via
177185
# -r requirements/base.txt
178186
# python-pptx
187+
zipp==3.15.0
188+
# via
189+
# -r requirements/base.txt
190+
# importlib-metadata

requirements/ingest-s3.txt

Lines changed: 2 additions & 7 deletions
Original file line numberDiff line numberDiff line change
@@ -16,9 +16,9 @@ backoff==2.2.1
1616
# via
1717
# -r requirements/base.txt
1818
# argilla
19-
boto3==1.26.79
19+
boto3==1.26.80
2020
# via unstructured (setup.py)
21-
botocore==1.29.79
21+
botocore==1.29.80
2222
# via
2323
# boto3
2424
# s3transfer
@@ -37,11 +37,6 @@ click==8.1.3
3737
# via
3838
# -r requirements/base.txt
3939
# nltk
40-
colorama==0.4.6
41-
# via
42-
# -r requirements/base.txt
43-
# click
44-
# tqdm
4540
deprecated==1.2.13
4641
# via
4742
# -r requirements/base.txt

requirements/local-inference.txt

Lines changed: 4 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -30,10 +30,6 @@ click==8.1.3
3030
# via
3131
# nltk
3232
# uvicorn
33-
colorama==0.4.6
34-
# via
35-
# click
36-
# tqdm
3733
coloredlogs==15.0.1
3834
# via onnxruntime
3935
contourpy==1.0.7
@@ -122,7 +118,7 @@ numpy==1.23.5
122118
# transformers
123119
omegaconf==2.3.0
124120
# via effdet
125-
onnxruntime==1.13.1
121+
onnxruntime==1.14.1
126122
# via unstructured-inference
127123
opencv-python==4.6.0.66
128124
# via
@@ -173,8 +169,6 @@ pydantic==1.10.5
173169
# fastapi
174170
pyparsing==3.0.9
175171
# via matplotlib
176-
pyreadline3==3.4.1
177-
# via humanfriendly
178172
pytesseract==0.3.10
179173
# via layoutparser
180174
python-dateutil==2.8.2
@@ -272,4 +266,6 @@ wrapt==1.14.1
272266
xlsxwriter==3.0.8
273267
# via python-pptx
274268
zipp==3.15.0
275-
# via importlib-resources
269+
# via
270+
# importlib-metadata
271+
# importlib-resources

test_unstructured_ingest/test-ingest-github.sh

Lines changed: 9 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -3,16 +3,23 @@
33
SCRIPT_DIR=$( cd -- "$( dirname -- "${BASH_SOURCE[0]}" )" &> /dev/null && pwd )
44
cd "$SCRIPT_DIR"/.. || exit 1
55

6+
if [[ "$CI" == "true" && "$(( RANDOM % 10))" != "1" ]]; then
7+
# NOTE(crag): proper fix is being tracked here: https://github.com/Unstructured-IO/unstructured/issues/306
8+
echo "Skipping ingest 90% of github ingest tests to avoid rate limiting issue."
9+
exit 0
10+
fi
11+
12+
613
PYTHONPATH=. ./unstructured/ingest/main.py --github-url dcneiner/Downloadify --github-file-glob '*.html,*.txt' --structured-output-dir github-downloadify-output --verbose
714

815
if ! diff -ru github-downloadify-output test_unstructured_ingest/expected-structured-output/github-downloadify ; then
916
echo
1017
echo "There are differences from the previously checked-in structured outputs."
1118
echo
1219
echo "If these differences are acceptable, copy the outputs from"
13-
echo "s3-small-batch-output/ to test_unstructured_ingest/expected-structured-output/s3-small-batch/ after running"
20+
echo "github-downloadify-output/ to test_unstructured_ingest/expected-structured-output/github-downloadify/ after running"
1421
echo
15-
echo " PYTHONPATH=. python examples/ingest/s3-small-batch/main.py --structured-output-dir s3-small-batch-output"
22+
echo " PYTHONPATH=. ./unstructured/ingest/main.py --github-url dcneiner/Downloadify --github-file-glob '*.html,*.txt' --structured-output-dir github-downloadify-output --verbose"
1623
echo
1724
exit 1
1825
fi

0 commit comments

Comments
 (0)