Skip to content

Commit 57f5a68

Browse files
ds-filipknefel (Filip Knefel) and pawel-kmiecik
authored
chore(deps): bump unstructured to 0.13.2 (Unstructured-IO#402)
Bump `unstructured` dependency to 0.13.2.

Test adjusted to reflect the table extraction change introduced in unstructured 0.13.0.

---------

Co-authored-by: Filip Knefel <[email protected]>
Co-authored-by: Paweł Kmiecik <[email protected]>
1 parent 0ebc6c9 commit 57f5a68

File tree

4 files changed

+107
-113
lines changed

4 files changed

+107
-113
lines changed

CHANGELOG.md

Lines changed: 2 additions & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -1,7 +1,8 @@
1-
## 0.0.66-dev1
1+
## 0.0.66-dev2
22

33
* Add support for `unique_element_ids` parameter.
44
* Add max lifetime, via MAX_LIFETIME_SECONDS env-var, to API containers
5+
* Bump unstructured to 0.13.2
56

67
## 0.0.65
78

requirements/base.txt

Lines changed: 37 additions & 43 deletions
Original file line numberDiff line numberDiff line change
@@ -19,7 +19,6 @@ beautifulsoup4==4.12.3
1919
certifi==2024.2.2
2020
# via
2121
# requests
22-
# unstructured
2322
# unstructured-client
2423
cffi==1.16.0
2524
# via cryptography
@@ -29,7 +28,6 @@ charset-normalizer==3.3.2
2928
# via
3029
# pdfminer-six
3130
# requests
32-
# unstructured
3331
# unstructured-client
3432
click==8.1.3
3533
# via
@@ -38,48 +36,46 @@ click==8.1.3
3836
# uvicorn
3937
coloredlogs==15.0.1
4038
# via onnxruntime
41-
contourpy==1.2.0
39+
contourpy==1.2.1
4240
# via matplotlib
4341
cryptography==42.0.5
4442
# via pdfminer-six
4543
cycler==0.12.1
4644
# via matplotlib
4745
dataclasses-json==0.6.4
48-
# via
49-
# unstructured
50-
# unstructured-client
51-
deepdiff==6.7.1
46+
# via unstructured
47+
dataclasses-json-speakeasy==0.5.11
5248
# via unstructured-client
5349
deprecated==1.2.14
5450
# via pikepdf
5551
effdet==0.4.1
5652
# via layoutparser
57-
emoji==2.10.1
53+
emoji==2.11.0
5854
# via unstructured
5955
et-xmlfile==1.1.0
6056
# via openpyxl
6157
exceptiongroup==1.2.0
6258
# via anyio
63-
fastapi==0.110.0
59+
fastapi==0.110.1
6460
# via -r requirements/base.in
65-
filelock==3.13.1
61+
filelock==3.13.4
6662
# via
6763
# huggingface-hub
6864
# torch
6965
# transformers
7066
filetype==1.2.0
7167
# via unstructured
72-
flatbuffers==24.3.7
68+
flatbuffers==24.3.25
7369
# via onnxruntime
74-
fonttools==4.49.0
70+
fonttools==4.51.0
7571
# via matplotlib
76-
fsspec==2024.2.0
72+
fsspec==2024.3.1
7773
# via
7874
# huggingface-hub
7975
# torch
8076
h11==0.14.0
8177
# via uvicorn
82-
huggingface-hub==0.21.4
78+
huggingface-hub==0.22.2
8379
# via
8480
# timm
8581
# tokenizers
@@ -96,7 +92,7 @@ iopath==0.1.10
9692
# via layoutparser
9793
jinja2==3.1.3
9894
# via torch
99-
joblib==1.3.2
95+
joblib==1.4.0
10096
# via nltk
10197
jsonpath-python==1.0.6
10298
# via unstructured-client
@@ -106,21 +102,22 @@ langdetect==1.0.9
106102
# via unstructured
107103
layoutparser[layoutmodels,tesseract]==0.3.4
108104
# via unstructured-inference
109-
lxml==5.1.0
105+
lxml==5.2.1
110106
# via
111107
# pikepdf
112108
# python-docx
113109
# python-pptx
114110
# unstructured
115-
markdown==3.5.2
111+
markdown==3.6
116112
# via unstructured
117113
markupsafe==2.1.5
118114
# via jinja2
119115
marshmallow==3.21.1
120116
# via
121117
# dataclasses-json
118+
# dataclasses-json-speakeasy
122119
# unstructured-client
123-
matplotlib==3.8.3
120+
matplotlib==3.8.4
124121
# via pycocotools
125122
mpmath==1.3.0
126123
# via sympy
@@ -130,7 +127,7 @@ mypy-extensions==1.0.0
130127
# via
131128
# typing-inspect
132129
# unstructured-client
133-
networkx==3.2.1
130+
networkx==3.3
134131
# via
135132
# torch
136133
# unstructured
@@ -154,7 +151,7 @@ olefile==0.47
154151
# via msg-parser
155152
omegaconf==2.3.0
156153
# via effdet
157-
onnx==1.15.0
154+
onnx==1.16.0
158155
# via
159156
# unstructured
160157
# unstructured-inference
@@ -166,8 +163,6 @@ opencv-python==4.9.0.80
166163
# unstructured-inference
167164
openpyxl==3.1.2
168165
# via unstructured
169-
ordered-set==4.1.0
170-
# via deepdiff
171166
packaging==24.0
172167
# via
173168
# huggingface-hub
@@ -193,9 +188,9 @@ pdfminer-six==20231228
193188
# unstructured
194189
pdfplumber==0.11.0
195190
# via layoutparser
196-
pikepdf==8.13.0
191+
pikepdf==8.15.0
197192
# via unstructured
198-
pillow==10.2.0
193+
pillow==10.3.0
199194
# via
200195
# layoutparser
201196
# matplotlib
@@ -207,19 +202,19 @@ pillow==10.2.0
207202
# python-pptx
208203
# torchvision
209204
# unstructured-pytesseract
210-
pillow-heif==0.15.0
205+
pillow-heif==0.16.0
211206
# via unstructured
212207
portalocker==2.8.2
213208
# via iopath
214-
protobuf==4.25.3
209+
protobuf==5.26.1
215210
# via
216211
# onnx
217212
# onnxruntime
218213
psutil==5.9.8
219214
# via -r requirements/base.in
220215
pycocotools==2.0.7
221216
# via effdet
222-
pycparser==2.21
217+
pycparser==2.22
223218
# via cffi
224219
pycryptodome==3.20.0
225220
# via -r requirements/base.in
@@ -231,12 +226,11 @@ pypandoc==1.13
231226
# via unstructured
232227
pyparsing==3.1.2
233228
# via matplotlib
234-
pypdf==4.1.0
229+
pypdf==4.2.0
235230
# via
236231
# -r requirements/base.in
237232
# unstructured
238-
# unstructured-client
239-
pypdfium2==4.28.0
233+
pypdfium2==4.29.0
240234
# via pdfplumber
241235
pytesseract==0.3.10
242236
# via layoutparser
@@ -264,7 +258,7 @@ pyyaml==6.0.1
264258
# omegaconf
265259
# timm
266260
# transformers
267-
rapidfuzz==3.6.2
261+
rapidfuzz==3.8.1
268262
# via
269263
# unstructured
270264
# unstructured-inference
@@ -286,7 +280,7 @@ safetensors==0.3.2
286280
# -c requirements/constraints.in
287281
# timm
288282
# transformers
289-
scipy==1.12.0
283+
scipy==1.13.0
290284
# via layoutparser
291285
six==1.16.0
292286
# via
@@ -297,7 +291,7 @@ sniffio==1.3.1
297291
# via anyio
298292
soupsieve==2.5
299293
# via beautifulsoup4
300-
starlette==0.36.3
294+
starlette==0.37.2
301295
# via fastapi
302296
sympy==1.12
303297
# via
@@ -309,13 +303,13 @@ timm==0.9.16
309303
# via effdet
310304
tokenizers==0.15.2
311305
# via transformers
312-
torch==2.2.1
306+
torch==2.2.2
313307
# via
314308
# effdet
315309
# layoutparser
316310
# timm
317311
# torchvision
318-
torchvision==0.17.1
312+
torchvision==0.17.2
319313
# via
320314
# effdet
321315
# layoutparser
@@ -328,14 +322,15 @@ tqdm==4.66.2
328322
# transformers
329323
transformers==4.37.1
330324
# via unstructured-inference
331-
typing-extensions==4.10.0
325+
typing-extensions==4.11.0
332326
# via
333327
# anyio
334328
# fastapi
335329
# huggingface-hub
336330
# iopath
337331
# pydantic
338332
# pydantic-core
333+
# pypdf
339334
# python-docx
340335
# torch
341336
# typing-inspect
@@ -345,24 +340,23 @@ typing-extensions==4.10.0
345340
typing-inspect==0.9.0
346341
# via
347342
# dataclasses-json
343+
# dataclasses-json-speakeasy
348344
# unstructured-client
349345
tzdata==2024.1
350346
# via pandas
351-
unstructured[local-inference]==0.12.5
352-
# via
353-
# -r requirements/base.in
354-
# unstructured
355-
unstructured-client==0.21.1
347+
unstructured[local-inference]==0.13.2
348+
# via -r requirements/base.in
349+
unstructured-client==0.18.0
356350
# via unstructured
357-
unstructured-inference==0.7.23
351+
unstructured-inference==0.7.25
358352
# via unstructured
359353
unstructured-pytesseract==0.3.12
360354
# via unstructured
361355
urllib3==2.2.1
362356
# via
363357
# requests
364358
# unstructured-client
365-
uvicorn==0.28.0
359+
uvicorn==0.29.0
366360
# via -r requirements/base.in
367361
wrapt==1.16.0
368362
# via

0 commit comments

Comments
 (0)