Skip to content

Commit 1ce8447

Browse files
authored
build(deps): bump unstructured inference; compile from setup.py (#176)
* bump unstructured inference; compile from setup.py * bump version * compile the local-inference extra * linting, linting, linting
1 parent 26a5546 commit 1ce8447

File tree

6 files changed

+84
-17
lines changed

6 files changed

+84
-17
lines changed

CHANGELOG.md

+2-1
Original file line numberDiff line numberDiff line change
@@ -1,11 +1,12 @@
1-
## 0.4.4-dev3
1+
## 0.4.4
22

33
* Updated `partition_pdf` and `partition_image` to return `unstructured` `Element` objects
44
* Fixed the healthcheck url path when partitioning images and PDFs via API
55
* Adds an optional `coordinates` attribute to document objects
66
* Adds `FigureCaption` and `CheckBox` document elements
77
* Added ability to split lists detected in `LayoutElement` objects
88
* Adds `partition_pptx` for partitioning PowerPoint documents
9+
* LayoutParser models now download from the Hugging Face Hub instead of Dropbox
910
* Fixed file type detection for XML and HTML files on Amazon Linux
1011

1112
## 0.4.3

Makefile

+1-1
Original file line numberDiff line numberDiff line change
@@ -73,7 +73,7 @@ pip-compile:
7373
pip-compile requirements/dev.in
7474
pip-compile requirements/test.in
7575
pip-compile requirements/build.in
76-
pip-compile requirements/local-inference.in
76+
pip-compile --extra local-inference -o requirements/local-inference.txt
7777
# NOTE(robinson) - docs/requirements.txt is where the GitHub action for building
7878
# sphinx docs looks for additional requirements
7979
cp requirements/build.txt docs/requirements.txt

requirements/local-inference.in

-1
This file was deleted.

requirements/local-inference.txt

+79-12
Original file line numberDiff line numberDiff line change
@@ -2,56 +2,91 @@
22
# This file is autogenerated by pip-compile with Python 3.8
33
# by the following command:
44
#
5-
# pip-compile requirements/local-inference.in
5+
# pip-compile --extra=local-inference --output-file=requirements/local-inference.txt
66
#
77
antlr4-python3-runtime==4.9.3
88
# via omegaconf
99
anyio==3.6.2
10-
# via starlette
10+
# via
11+
# httpcore
12+
# starlette
13+
argilla==1.2.1
14+
# via unstructured (setup.py)
15+
backoff==2.2.1
16+
# via argilla
1117
certifi==2022.12.7
12-
# via requests
18+
# via
19+
# httpcore
20+
# httpx
21+
# requests
22+
# unstructured (setup.py)
1323
cffi==1.15.1
1424
# via cryptography
1525
charset-normalizer==3.0.1
1626
# via
1727
# pdfminer-six
1828
# requests
1929
click==8.1.3
20-
# via uvicorn
30+
# via
31+
# nltk
32+
# uvicorn
2133
contourpy==1.0.7
2234
# via matplotlib
2335
cryptography==39.0.0
2436
# via pdfminer-six
2537
cycler==0.11.0
2638
# via matplotlib
39+
deprecated==1.2.13
40+
# via argilla
2741
effdet==0.3.0
2842
# via layoutparser
43+
et-xmlfile==1.1.0
44+
# via openpyxl
2945
fastapi==0.89.1
3046
# via unstructured-inference
3147
filelock==3.9.0
3248
# via huggingface-hub
3349
fonttools==4.38.0
3450
# via matplotlib
3551
h11==0.14.0
36-
# via uvicorn
37-
huggingface-hub==0.11.1
52+
# via
53+
# httpcore
54+
# uvicorn
55+
httpcore==0.16.3
56+
# via httpx
57+
httpx==0.23.3
58+
# via argilla
59+
huggingface-hub==0.12.0
3860
# via
3961
# timm
4062
# unstructured-inference
4163
idna==3.4
4264
# via
4365
# anyio
4466
# requests
67+
# rfc3986
4568
iopath==0.1.10
4669
# via layoutparser
70+
joblib==1.2.0
71+
# via nltk
4772
kiwisolver==1.4.4
4873
# via matplotlib
4974
layoutparser[layoutmodels,tesseract]==0.3.4
5075
# via unstructured-inference
76+
lxml==4.9.2
77+
# via
78+
# python-docx
79+
# python-pptx
80+
# unstructured (setup.py)
5181
matplotlib==3.6.3
5282
# via pycocotools
53-
numpy==1.24.1
83+
monotonic==1.6
84+
# via argilla
85+
nltk==3.8.1
86+
# via unstructured (setup.py)
87+
numpy==1.23.5
5488
# via
89+
# argilla
5590
# contourpy
5691
# layoutparser
5792
# matplotlib
@@ -66,13 +101,19 @@ opencv-python==4.6.0.66
66101
# via
67102
# layoutparser
68103
# unstructured-inference
104+
openpyxl==3.0.10
105+
# via unstructured (setup.py)
69106
packaging==23.0
70107
# via
108+
# argilla
71109
# huggingface-hub
72110
# matplotlib
73111
# pytesseract
74112
pandas==1.5.3
75-
# via layoutparser
113+
# via
114+
# argilla
115+
# layoutparser
116+
# unstructured (setup.py)
76117
pdf2image==1.16.2
77118
# via layoutparser
78119
pdfminer-six==20221105
@@ -86,15 +127,19 @@ pillow==9.4.0
86127
# pdf2image
87128
# pdfplumber
88129
# pytesseract
130+
# python-pptx
89131
# torchvision
132+
# unstructured (setup.py)
90133
portalocker==2.7.0
91134
# via iopath
92135
pycocotools==2.0.6
93136
# via effdet
94137
pycparser==2.21
95138
# via cffi
96139
pydantic==1.10.4
97-
# via fastapi
140+
# via
141+
# argilla
142+
# fastapi
98143
pyparsing==3.0.9
99144
# via matplotlib
100145
pytesseract==0.3.10
@@ -103,8 +148,14 @@ python-dateutil==2.8.2
103148
# via
104149
# matplotlib
105150
# pandas
151+
python-docx==0.8.11
152+
# via unstructured (setup.py)
153+
python-magic==0.4.27
154+
# via unstructured (setup.py)
106155
python-multipart==0.0.5
107156
# via unstructured-inference
157+
python-pptx==0.6.21
158+
# via unstructured (setup.py)
108159
pytz==2022.7.1
109160
# via pandas
110161
pyyaml==6.0
@@ -113,18 +164,26 @@ pyyaml==6.0
113164
# layoutparser
114165
# omegaconf
115166
# timm
167+
regex==2022.10.31
168+
# via nltk
116169
requests==2.28.2
117170
# via
118171
# huggingface-hub
119172
# torchvision
173+
# unstructured (setup.py)
174+
rfc3986[idna2008]==1.5.0
175+
# via httpx
120176
scipy==1.10.0
121177
# via layoutparser
122178
six==1.16.0
123179
# via
124180
# python-dateutil
125181
# python-multipart
126182
sniffio==1.3.0
127-
# via anyio
183+
# via
184+
# anyio
185+
# httpcore
186+
# httpx
128187
starlette==0.22.0
129188
# via fastapi
130189
timm==0.6.12
@@ -142,8 +201,10 @@ torchvision==0.14.1
142201
# timm
143202
tqdm==4.64.1
144203
# via
204+
# argilla
145205
# huggingface-hub
146206
# iopath
207+
# nltk
147208
typing-extensions==4.4.0
148209
# via
149210
# huggingface-hub
@@ -152,11 +213,17 @@ typing-extensions==4.4.0
152213
# starlette
153214
# torch
154215
# torchvision
155-
unstructured-inference==0.2.3
156-
# via -r requirements/local-inference.in
216+
unstructured-inference==0.2.4
217+
# via unstructured (setup.py)
157218
urllib3==1.26.14
158219
# via requests
159220
uvicorn==0.20.0
160221
# via unstructured-inference
161222
wand==0.6.11
162223
# via pdfplumber
224+
wrapt==1.14.1
225+
# via
226+
# argilla
227+
# deprecated
228+
xlsxwriter==3.0.7
229+
# via python-pptx

setup.py

+1-1
Original file line numberDiff line numberDiff line change
@@ -70,6 +70,6 @@
7070
"torch",
7171
"transformers",
7272
],
73-
"local-inference": ["unstructured-inference>=0.2.3"],
73+
"local-inference": ["unstructured-inference>=0.2.4"],
7474
},
7575
)

unstructured/__version__.py

+1-1
Original file line numberDiff line numberDiff line change
@@ -1 +1 @@
1-
__version__ = "0.4.4-dev3" # pragma: no cover
1+
__version__ = "0.4.4" # pragma: no cover

0 commit comments

Comments
 (0)