Skip to content

Commit 1a94d95

Browse files
authored
chore: dependency bumps, release commit for 0.16.12 (#3831)
1 parent e2d0280 commit 1a94d95

File tree

12 files changed: +47 -47 lines changed

12 files changed: +47 -47 lines changed

CHANGELOG.md

+3 -3
Original file line number | Diff line number | Diff line change
@@ -1,15 +1,15 @@
1-
## 0.16.12-dev5
1+
## 0.16.12
22

33
### Enhancements
44

55
- **Prepare auto-partitioning for pluggable partitioners**. Move toward a uniform partitioner call signature so a custom or override partitioner can be registered without code changes.
6-
- **Add NDJSON file type support**
6+
- **Add NDJSON file type support.**
77

88
### Features
99

1010
### Fixes
1111

12-
- Base image has been updated, trigger new workflows
12+
- **Base image has been updated.**
1313
- **Upgrade ruff to latest.** Previously the ruff version was pinned to <0.5. Remove that pin and fix the handful of lint items that resulted.
1414
- **CSV with asserted XLS content-type is correctly identified as CSV.** Resolves a bug where a CSV file with an asserted content-type of `application/vnd.ms-excel` was incorrectly identified as an XLS file.
1515
- **Improve element-type mapping for Chinese text.** Fixes bug where Chinese text would produce large numbers of false-positive `Title` elements.

requirements/base.txt

+4 -4
Original file line number | Diff line number | Diff line change
@@ -20,11 +20,11 @@ cffi==1.17.1
2020
# via cryptography
2121
chardet==5.2.0
2222
# via -r ./base.in
23-
charset-normalizer==3.4.0
23+
charset-normalizer==3.4.1
2424
# via
2525
# requests
2626
# unstructured-client
27-
click==8.1.7
27+
click==8.1.8
2828
# via
2929
# nltk
3030
# python-oxmsg
@@ -64,7 +64,7 @@ langdetect==1.0.9
6464
# via -r ./base.in
6565
lxml==5.3.0
6666
# via -r ./base.in
67-
marshmallow==3.23.1
67+
marshmallow==3.23.2
6868
# via
6969
# dataclasses-json
7070
# unstructured-client
@@ -88,7 +88,7 @@ packaging==24.2
8888
# via
8989
# marshmallow
9090
# unstructured-client
91-
psutil==6.1.0
91+
psutil==6.1.1
9292
# via -r ./base.in
9393
pycparser==2.22
9494
# via cffi

requirements/dev.txt

+3 -3
Original file line number | Diff line number | Diff line change
@@ -8,7 +8,7 @@ build==1.2.2.post1
88
# via pip-tools
99
cfgv==3.4.0
1010
# via pre-commit
11-
click==8.1.7
11+
click==8.1.8
1212
# via
1313
# -c ./base.txt
1414
# -c ./test.txt
@@ -17,7 +17,7 @@ distlib==0.3.9
1717
# via virtualenv
1818
filelock==3.16.1
1919
# via virtualenv
20-
identify==2.6.3
20+
identify==2.6.4
2121
# via pre-commit
2222
importlib-metadata==8.5.0
2323
# via
@@ -51,7 +51,7 @@ tomli==2.2.1
5151
# -c ./test.txt
5252
# build
5353
# pip-tools
54-
virtualenv==20.28.0
54+
virtualenv==20.28.1
5555
# via pre-commit
5656
wheel==0.45.1
5757
# via pip-tools

requirements/extra-paddleocr.txt

+4 -4
Original file line number | Diff line number | Diff line change
@@ -16,7 +16,7 @@ certifi==2024.12.14
1616
# httpcore
1717
# httpx
1818
# requests
19-
charset-normalizer==3.4.0
19+
charset-normalizer==3.4.1
2020
# via
2121
# -c ./base.txt
2222
# requests
@@ -58,7 +58,7 @@ imageio==2.36.1
5858
# scikit-image
5959
imgaug==0.4.0
6060
# via unstructured-paddleocr
61-
importlib-resources==6.4.5
61+
importlib-resources==6.5.1
6262
# via matplotlib
6363
kiwisolver==1.4.7
6464
# via matplotlib
@@ -104,7 +104,7 @@ paddlepaddle==3.0.0b1
104104
# via -r ./extra-paddleocr.in
105105
pdf2image==1.17.0
106106
# via unstructured-paddleocr
107-
pillow==11.0.0
107+
pillow==11.1.0
108108
# via
109109
# imageio
110110
# imgaug
@@ -119,7 +119,7 @@ protobuf==4.25.5
119119
# paddlepaddle
120120
pyclipper==1.3.0.post6
121121
# via unstructured-paddleocr
122-
pyparsing==3.2.0
122+
pyparsing==3.2.1
123123
# via matplotlib
124124
python-dateutil==2.9.0.post0
125125
# via

requirements/extra-pdf-image.txt

+12 -12
Original file line number | Diff line number | Diff line change
@@ -16,7 +16,7 @@ cffi==1.17.1
1616
# via
1717
# -c ./base.txt
1818
# cryptography
19-
charset-normalizer==3.4.0
19+
charset-normalizer==3.4.1
2020
# via
2121
# -c ./base.txt
2222
# pdfminer-six
@@ -40,11 +40,11 @@ filelock==3.16.1
4040
# huggingface-hub
4141
# torch
4242
# transformers
43-
flatbuffers==24.3.25
43+
flatbuffers==24.12.23
4444
# via onnxruntime
4545
fonttools==4.55.3
4646
# via matplotlib
47-
fsspec==2024.10.0
47+
fsspec==2024.12.0
4848
# via
4949
# huggingface-hub
5050
# torch
@@ -79,11 +79,11 @@ idna==3.10
7979
# via
8080
# -c ./base.txt
8181
# requests
82-
importlib-resources==6.4.5
82+
importlib-resources==6.5.1
8383
# via matplotlib
8484
iopath==0.1.10
8585
# via layoutparser
86-
jinja2==3.1.4
86+
jinja2==3.1.5
8787
# via torch
8888
kiwisolver==1.4.7
8989
# via matplotlib
@@ -149,13 +149,13 @@ pdfminer-six==20231228
149149
# via
150150
# -r ./extra-pdf-image.in
151151
# pdfplumber
152-
pdfplumber==0.11.4
152+
pdfplumber==0.11.5
153153
# via layoutparser
154154
pi-heif==0.21.0
155155
# via -r ./extra-pdf-image.in
156-
pikepdf==9.4.2
156+
pikepdf==9.5.0
157157
# via -r ./extra-pdf-image.in
158-
pillow==11.0.0
158+
pillow==11.1.0
159159
# via
160160
# layoutparser
161161
# matplotlib
@@ -165,7 +165,7 @@ pillow==11.0.0
165165
# pikepdf
166166
# torchvision
167167
# unstructured-pytesseract
168-
portalocker==3.0.0
168+
portalocker==3.1.1
169169
# via iopath
170170
proto-plus==1.25.0
171171
# via
@@ -193,13 +193,13 @@ pycparser==2.22
193193
# via
194194
# -c ./base.txt
195195
# cffi
196-
pyparsing==3.2.0
196+
pyparsing==3.2.1
197197
# via matplotlib
198198
pypdf==5.1.0
199199
# via
200200
# -c ./base.txt
201201
# -r ./extra-pdf-image.in
202-
pypdfium2==4.30.0
202+
pypdfium2==4.30.1
203203
# via pdfplumber
204204
python-dateutil==2.9.0.post0
205205
# via
@@ -233,7 +233,7 @@ requests==2.32.3
233233
# transformers
234234
rsa==4.9
235235
# via google-auth
236-
safetensors==0.4.5
236+
safetensors==0.5.0
237237
# via
238238
# timm
239239
# transformers

requirements/extra-pptx.txt

+1 -1
Original file line number | Diff line number | Diff line change
@@ -6,7 +6,7 @@
66
#
77
lxml==5.3.0
88
# via python-pptx
9-
pillow==11.0.0
9+
pillow==11.1.0
1010
# via python-pptx
1111
python-pptx==1.0.2
1212
# via -r ./extra-pptx.in

requirements/huggingface.txt

+5 -5
Original file line number | Diff line number | Diff line change
@@ -8,11 +8,11 @@ certifi==2024.12.14
88
# via
99
# -c ./base.txt
1010
# requests
11-
charset-normalizer==3.4.0
11+
charset-normalizer==3.4.1
1212
# via
1313
# -c ./base.txt
1414
# requests
15-
click==8.1.7
15+
click==8.1.8
1616
# via
1717
# -c ./base.txt
1818
# sacremoses
@@ -21,7 +21,7 @@ filelock==3.16.1
2121
# huggingface-hub
2222
# torch
2323
# transformers
24-
fsspec==2024.10.0
24+
fsspec==2024.12.0
2525
# via
2626
# huggingface-hub
2727
# torch
@@ -33,7 +33,7 @@ idna==3.10
3333
# via
3434
# -c ./base.txt
3535
# requests
36-
jinja2==3.1.4
36+
jinja2==3.1.5
3737
# via torch
3838
joblib==1.4.2
3939
# via
@@ -74,7 +74,7 @@ requests==2.32.3
7474
# transformers
7575
sacremoses==0.1.1
7676
# via -r ./huggingface.in
77-
safetensors==0.4.5
77+
safetensors==0.5.0
7878
# via transformers
7979
sentencepiece==0.2.0
8080
# via -r ./huggingface.in

requirements/test.txt

+11 -11
Original file line number | Diff line number | Diff line change
@@ -12,7 +12,7 @@ anyio==4.7.0
1212
# httpx
1313
appdirs==1.4.4
1414
# via label-studio-sdk
15-
argcomplete==3.5.2
15+
argcomplete==3.5.3
1616
# via datamodel-code-generator
1717
attrs==24.3.0
1818
# via
@@ -30,16 +30,16 @@ certifi==2024.12.14
3030
# httpcore
3131
# httpx
3232
# requests
33-
charset-normalizer==3.4.0
33+
charset-normalizer==3.4.1
3434
# via
3535
# -c ./base.txt
3636
# requests
37-
click==8.1.7
37+
click==8.1.8
3838
# via
3939
# -c ./base.txt
4040
# black
4141
# nltk
42-
coverage[toml]==7.6.9
42+
coverage[toml]==7.6.10
4343
# via
4444
# -r ./test.in
4545
# pytest-cov
@@ -98,7 +98,7 @@ iniconfig==2.0.0
9898
# via pytest
9999
isort==5.13.2
100100
# via datamodel-code-generator
101-
jinja2==3.1.4
101+
jinja2==3.1.5
102102
# via datamodel-code-generator
103103
joblib==1.4.2
104104
# via
@@ -126,7 +126,7 @@ mccabe==0.7.0
126126
# via flake8
127127
multidict==6.1.0
128128
# via yarl
129-
mypy==1.13.0
129+
mypy==1.14.1
130130
# via -r ./test.in
131131
mypy-extensions==1.0.0
132132
# via
@@ -152,7 +152,7 @@ pandas==2.2.3
152152
# via label-studio-sdk
153153
pathspec==0.12.1
154154
# via black
155-
pillow==11.0.0
155+
pillow==11.1.0
156156
# via label-studio-sdk
157157
platformdirs==4.3.6
158158
# via black
@@ -164,13 +164,13 @@ pycodestyle==2.12.1
164164
# via
165165
# flake8
166166
# flake8-print
167-
pydantic[email]==2.10.3
167+
pydantic[email]==2.10.4
168168
# via
169169
# -r ./test.in
170170
# datamodel-code-generator
171171
# jsf
172172
# label-studio-sdk
173-
pydantic-core==2.27.1
173+
pydantic-core==2.27.2
174174
# via pydantic
175175
pyflakes==3.2.0
176176
# via
@@ -218,7 +218,7 @@ rpds-py==0.22.3
218218
# referencing
219219
rstr==3.2.2
220220
# via jsf
221-
ruff==0.8.3
221+
ruff==0.8.5
222222
# via -r ./test.in
223223
semantic-version==2.10.0
224224
# via liccheck
@@ -279,7 +279,7 @@ urllib3==1.26.20
279279
# -c ./base.txt
280280
# requests
281281
# vcrpy
282-
vcrpy==6.0.2
282+
vcrpy==7.0.0
283283
# via -r ./test.in
284284
wrapt==1.17.0
285285
# via

test_unstructured_ingest/expected-structured-output/outlook/21be155fb0c95885.eml.json

+1 -1
Original file line number | Diff line number | Diff line change
@@ -26,7 +26,7 @@
2626
},
2727
"date_created": "1689435368.0",
2828
"date_modified": "1689435537.0",
29-
"filesize_bytes": 9189
29+
"filesize_bytes": 9179
3030
}
3131
}
3232
}

test_unstructured_ingest/expected-structured-output/outlook/497eba8c81c801c6.eml.json

+1 -1
Original file line number | Diff line number | Diff line change
@@ -26,7 +26,7 @@
2626
},
2727
"date_created": "1690248382.0",
2828
"date_modified": "1690248401.0",
29-
"filesize_bytes": 9207
29+
"filesize_bytes": 9197
3030
}
3131
}
3232
}

test_unstructured_ingest/expected-structured-output/outlook/4a16a411f162ebbb.eml.json

+1 -1
Original file line number | Diff line number | Diff line change
@@ -26,7 +26,7 @@
2626
},
2727
"date_created": "1688960344.0",
2828
"date_modified": "1689460572.0",
29-
"filesize_bytes": 9254
29+
"filesize_bytes": 9244
3030
}
3131
}
3232
}

unstructured/__version__.py

+1 -1
Original file line number | Diff line number | Diff line change
@@ -1 +1 @@
1-
__version__ = "0.16.12-dev5" # pragma: no cover
1+
__version__ = "0.16.12" # pragma: no cover

0 commit comments

Comments
 (0)