Skip to content

Commit 305247b

Browse files
authored
chore: bump unstructured-inference pin (#2913)
**Summary** Update dependencies to use the new version of `unstructured-inference` released yesterday. Remedy a few small problems with `make pip-compile` that stood in the way.
1 parent 9ad2993 commit 305247b

34 files changed

+133
-134
lines changed

Diff for: CHANGELOG.md

+1 -1
Original file line number | Diff line number | Diff line change
@@ -1,4 +1,4 @@
1-
## 0.13.3-dev9
1+
## 0.13.3
22

33
### Enhancements
44

Diff for: requirements/Makefile

+2 -2
Original file line number | Diff line number | Diff line change
@@ -24,11 +24,11 @@ compile-base:
2424

2525
.PHONY: compile-all-base
2626
compile-all-base: compile-base compile-test compile-dev
27-
@$(foreach file,$(BASE_REQUIREMENTS),echo "compiling: $(file)" && pip-compile --upgrade $(file);)
27+
@$(foreach file,$(BASE_REQUIREMENTS),echo -e "\n\ncompiling: $(file)" && pip-compile --no-strip-extras --upgrade $(file) || exit;)
2828

2929
.PHONY: compile-ingest
3030
compile-ingest:
31-
@$(foreach file,$(INGEST_REQUIREMENTS),echo "compiling: $(file)" && pip-compile --upgrade $(file);)
31+
@$(foreach file,$(INGEST_REQUIREMENTS),echo -e "\n\ncompiling: $(file)" && pip-compile --no-strip-extras --upgrade $(file) || exit;)
3232

3333
.PHONY: clean
3434
clean: clean-base clean-ingest

Diff for: requirements/base.txt

+1 -1
Original file line number | Diff line number | Diff line change
@@ -69,7 +69,7 @@ python-magic==0.4.27
6969
# via -r ./base.in
7070
rapidfuzz==3.8.1
7171
# via -r ./base.in
72-
regex==2023.12.25
72+
regex==2024.4.16
7373
# via nltk
7474
requests==2.31.0
7575
# via

Diff for: requirements/deps/constraints.txt

-3
Original file line number | Diff line number | Diff line change
@@ -22,8 +22,6 @@ Office365-REST-Python-Client<2.4.3
2222
# unstructured-inference to be upgraded when unstructured library is upgraded
2323
# https://github.com/Unstructured-IO/unstructured/issues/1458
2424
# unstructured-inference
25-
# unable to build wheel for arm on 0.3.3+
26-
safetensors<=0.3.2
2725
# use the known compatible version of weaviate and unstructured.pytesseract
2826
unstructured.pytesseract>=0.3.12
2927
weaviate-client>3.25.0
@@ -38,7 +36,6 @@ torch>2
3836
# pinned in unstructured paddleocr
3937
opencv-python==4.8.0.76
4038
opencv-contrib-python==4.8.0.76
41-
onnxruntime==1.15.1
4239
platformdirs==3.10.0
4340

4441
# TODO: Constraint due to langchain, remove when that gets updated:

Diff for: requirements/dev.txt

+7 -7
Original file line number | Diff line number | Diff line change
@@ -73,7 +73,7 @@ defusedxml==0.7.1
7373
# via nbconvert
7474
distlib==0.3.8
7575
# via virtualenv
76-
exceptiongroup==1.2.0
76+
exceptiongroup==1.2.1
7777
# via
7878
# -c ./test.txt
7979
# anyio
@@ -91,7 +91,7 @@ httpcore==1.0.5
9191
# via httpx
9292
httpx==0.27.0
9393
# via jupyterlab
94-
identify==2.5.35
94+
identify==2.5.36
9595
# via pre-commit
9696
idna==3.7
9797
# via
@@ -195,7 +195,7 @@ markupsafe==2.1.5
195195
# via
196196
# jinja2
197197
# nbconvert
198-
matplotlib-inline==0.1.6
198+
matplotlib-inline==0.1.7
199199
# via
200200
# ipykernel
201201
# ipython
@@ -216,7 +216,7 @@ nest-asyncio==1.6.0
216216
# via ipykernel
217217
nodeenv==1.8.0
218218
# via pre-commit
219-
notebook==7.1.2
219+
notebook==7.1.3
220220
# via jupyter
221221
notebook-shim==0.2.4
222222
# via
@@ -294,7 +294,7 @@ pyyaml==6.0.1
294294
# -c ./test.txt
295295
# jupyter-events
296296
# pre-commit
297-
pyzmq==25.1.2
297+
pyzmq==26.0.2
298298
# via
299299
# ipykernel
300300
# jupyter-client
@@ -368,7 +368,7 @@ tornado==6.4
368368
# jupyterlab
369369
# notebook
370370
# terminado
371-
traitlets==5.14.2
371+
traitlets==5.14.3
372372
# via
373373
# comm
374374
# ipykernel
@@ -401,7 +401,7 @@ urllib3==1.26.18
401401
# -c ./base.txt
402402
# -c ./test.txt
403403
# requests
404-
virtualenv==20.25.1
404+
virtualenv==20.25.3
405405
# via pre-commit
406406
wcwidth==0.2.13
407407
# via prompt-toolkit

Diff for: requirements/extra-paddleocr.txt

+3 -3
Original file line number | Diff line number | Diff line change
@@ -63,7 +63,7 @@ importlib-metadata==7.1.0
6363
# via flask
6464
importlib-resources==6.4.0
6565
# via matplotlib
66-
itsdangerous==2.1.2
66+
itsdangerous==2.2.0
6767
# via flask
6868
jinja2==3.1.3
6969
# via
@@ -188,7 +188,7 @@ scipy==1.10.1
188188
# -c ././deps/constraints.txt
189189
# imgaug
190190
# scikit-image
191-
shapely==2.0.3
191+
shapely==2.0.4
192192
# via
193193
# imgaug
194194
# unstructured-paddleocr
@@ -200,7 +200,7 @@ six==1.16.0
200200
# imgaug
201201
# python-dateutil
202202
# visualdl
203-
tifffile==2024.2.12
203+
tifffile==2024.4.18
204204
# via scikit-image
205205
tqdm==4.66.2
206206
# via

Diff for: requirements/extra-pdf-image.in

+1 -1
Original file line number | Diff line number | Diff line change
@@ -9,7 +9,7 @@ pillow_heif
99
pypdf
1010
# Do not move to constraints.in, otherwise unstructured-inference will not be upgraded
1111
# when unstructured library is.
12-
unstructured-inference==0.7.25
12+
unstructured-inference==0.7.27
1313
# unstructured fork of pytesseract that provides an interface to allow for multiple output formats
1414
# from one tesseract call
1515
unstructured.pytesseract>=0.3.12

Diff for: requirements/extra-pdf-image.txt

+8 -11
Original file line number | Diff line number | Diff line change
@@ -100,10 +100,8 @@ onnx==1.16.0
100100
# via
101101
# -r ./extra-pdf-image.in
102102
# unstructured-inference
103-
onnxruntime==1.15.1
104-
# via
105-
# -c ././deps/constraints.txt
106-
# unstructured-inference
103+
onnxruntime==1.17.3
104+
# via unstructured-inference
107105
opencv-python==4.8.0.76
108106
# via
109107
# -c ././deps/constraints.txt
@@ -132,7 +130,7 @@ pdfminer-six==20231228
132130
# pdfplumber
133131
pdfplumber==0.11.0
134132
# via layoutparser
135-
pikepdf==8.15.0
133+
pikepdf==8.15.1
136134
# via -r ./extra-pdf-image.in
137135
pillow==10.3.0
138136
# via
@@ -190,7 +188,7 @@ rapidfuzz==3.8.1
190188
# via
191189
# -c ./base.txt
192190
# unstructured-inference
193-
regex==2023.12.25
191+
regex==2024.4.16
194192
# via
195193
# -c ./base.txt
196194
# transformers
@@ -199,9 +197,8 @@ requests==2.31.0
199197
# -c ./base.txt
200198
# huggingface-hub
201199
# transformers
202-
safetensors==0.3.2
200+
safetensors==0.4.3
203201
# via
204-
# -c ././deps/constraints.txt
205202
# timm
206203
# transformers
207204
scipy==1.10.1
@@ -218,7 +215,7 @@ sympy==1.12
218215
# torch
219216
timm==0.9.16
220217
# via effdet
221-
tokenizers==0.15.2
218+
tokenizers==0.19.1
222219
# via transformers
223220
torch==2.2.2
224221
# via
@@ -238,7 +235,7 @@ tqdm==4.66.2
238235
# huggingface-hub
239236
# iopath
240237
# transformers
241-
transformers==4.37.1
238+
transformers==4.40.0
242239
# via unstructured-inference
243240
typing-extensions==4.11.0
244241
# via
@@ -249,7 +246,7 @@ typing-extensions==4.11.0
249246
# torch
250247
tzdata==2024.1
251248
# via pandas
252-
unstructured-inference==0.7.25
249+
unstructured-inference==0.7.27
253250
# via -r ./extra-pdf-image.in
254251
unstructured-pytesseract==0.3.12
255252
# via

Diff for: requirements/huggingface.txt

+5 -7
Original file line number | Diff line number | Diff line change
@@ -64,7 +64,7 @@ pyyaml==6.0.1
6464
# via
6565
# huggingface-hub
6666
# transformers
67-
regex==2023.12.25
67+
regex==2024.4.16
6868
# via
6969
# -c ./base.txt
7070
# sacremoses
@@ -76,10 +76,8 @@ requests==2.31.0
7676
# transformers
7777
sacremoses==0.1.1
7878
# via -r ./huggingface.in
79-
safetensors==0.3.2
80-
# via
81-
# -c ././deps/constraints.txt
82-
# transformers
79+
safetensors==0.4.3
80+
# via transformers
8381
sentencepiece==0.2.0
8482
# via -r ./huggingface.in
8583
six==1.16.0
@@ -88,7 +86,7 @@ six==1.16.0
8886
# langdetect
8987
sympy==1.12
9088
# via torch
91-
tokenizers==0.15.2
89+
tokenizers==0.19.1
9290
# via transformers
9391
torch==2.2.2
9492
# via
@@ -100,7 +98,7 @@ tqdm==4.66.2
10098
# huggingface-hub
10199
# sacremoses
102100
# transformers
103-
transformers==4.37.1
101+
transformers==4.40.0
104102
# via -r ./huggingface.in
105103
typing-extensions==4.11.0
106104
# via

Diff for: requirements/ingest/astra.txt

+5 -3
Original file line number | Diff line number | Diff line change
@@ -14,7 +14,7 @@ bson==0.5.10
1414
# via astrapy
1515
cassandra-driver==3.29.1
1616
# via cassio
17-
cassio==0.1.5
17+
cassio==0.1.6
1818
# via astrapy
1919
certifi==2024.2.2
2020
# via
@@ -33,7 +33,7 @@ click==8.1.7
3333
# geomet
3434
deprecation==2.1.0
3535
# via astrapy
36-
exceptiongroup==1.2.0
36+
exceptiongroup==1.2.1
3737
# via anyio
3838
geomet==0.2.1.post1
3939
# via cassandra-driver
@@ -46,7 +46,9 @@ hpack==4.0.0
4646
httpcore==1.0.5
4747
# via httpx
4848
httpx[http2]==0.27.0
49-
# via astrapy
49+
# via
50+
# astrapy
51+
# httpx
5052
hyperframe==6.0.1
5153
# via h2
5254
idna==3.7

Diff for: requirements/ingest/azure.txt

+5 -3
Original file line number | Diff line number | Diff line change
@@ -4,9 +4,9 @@
44
#
55
# pip-compile ./ingest/azure.in
66
#
7-
adlfs==2024.2.0
7+
adlfs==2024.4.1
88
# via -r ./ingest/azure.in
9-
aiohttp==3.9.4
9+
aiohttp==3.9.5
1010
# via adlfs
1111
aiosignal==1.3.1
1212
# via aiohttp
@@ -80,7 +80,9 @@ portalocker==2.8.2
8080
pycparser==2.22
8181
# via cffi
8282
pyjwt[crypto]==2.8.0
83-
# via msal
83+
# via
84+
# msal
85+
# pyjwt
8486
requests==2.31.0
8587
# via
8688
# -c ./ingest/../base.txt

Diff for: requirements/ingest/box.txt

+3 -1
Original file line number | Diff line number | Diff line change
@@ -9,7 +9,9 @@ attrs==23.2.0
99
boxfs==0.3.0
1010
# via -r ./ingest/box.in
1111
boxsdk[jwt]==3.9.2
12-
# via boxfs
12+
# via
13+
# boxfs
14+
# boxsdk
1315
certifi==2024.2.2
1416
# via
1517
# -c ./ingest/../base.txt

Diff for: requirements/ingest/chroma.txt

+10 -10
Original file line number | Diff line number | Diff line change
@@ -44,9 +44,9 @@ coloredlogs==15.0.1
4444
# via onnxruntime
4545
deprecated==1.2.14
4646
# via opentelemetry-api
47-
exceptiongroup==1.2.0
47+
exceptiongroup==1.2.1
4848
# via anyio
49-
fastapi==0.110.1
49+
fastapi==0.110.2
5050
# via chromadb
5151
filelock==3.13.4
5252
# via huggingface-hub
@@ -58,7 +58,7 @@ google-auth==2.29.0
5858
# via kubernetes
5959
googleapis-common-protos==1.63.0
6060
# via opentelemetry-exporter-otlp-proto-grpc
61-
grpcio==1.62.1
61+
grpcio==1.62.2
6262
# via
6363
# chromadb
6464
# opentelemetry-exporter-otlp-proto-grpc
@@ -95,10 +95,8 @@ oauthlib==3.2.2
9595
# via
9696
# kubernetes
9797
# requests-oauthlib
98-
onnxruntime==1.15.1
99-
# via
100-
# -c ./ingest/../deps/constraints.txt
101-
# chromadb
98+
onnxruntime==1.17.3
99+
# via chromadb
102100
opentelemetry-api==1.16.0
103101
# via
104102
# chromadb
@@ -131,7 +129,7 @@ protobuf==4.23.4
131129
# googleapis-common-protos
132130
# onnxruntime
133131
# opentelemetry-proto
134-
pulsar-client==3.4.0
132+
pulsar-client==3.5.0
135133
# via chromadb
136134
pyasn1==0.6.0
137135
# via
@@ -186,7 +184,7 @@ sympy==1.12
186184
# via onnxruntime
187185
tenacity==8.2.3
188186
# via chromadb
189-
tokenizers==0.15.2
187+
tokenizers==0.19.1
190188
# via chromadb
191189
tqdm==4.66.2
192190
# via
@@ -216,7 +214,9 @@ urllib3==1.26.18
216214
# kubernetes
217215
# requests
218216
uvicorn[standard]==0.29.0
219-
# via chromadb
217+
# via
218+
# chromadb
219+
# uvicorn
220220
uvloop==0.19.0
221221
# via uvicorn
222222
watchfiles==0.21.0

Diff for: requirements/ingest/clarifai.txt

+2 -2
Original file line number | Diff line number | Diff line change
@@ -13,15 +13,15 @@ charset-normalizer==3.3.2
1313
# via
1414
# -c ./ingest/../base.txt
1515
# requests
16-
clarifai==10.3.0
16+
clarifai==10.3.1
1717
# via -r ./ingest/clarifai.in
1818
clarifai-grpc==10.2.3
1919
# via clarifai
2020
contextlib2==21.6.0
2121
# via schema
2222
googleapis-common-protos==1.63.0
2323
# via clarifai-grpc
24-
grpcio==1.62.1
24+
grpcio==1.62.2
2525
# via clarifai-grpc
2626
idna==3.7
2727
# via

0 commit comments

Comments
 (0)