chore: dependency updates to resolve cves (#4124)

<!-- CURSOR_SUMMARY -->
> [!NOTE]
> Release 0.18.21 with broad dependency pin updates across requirements
> (notably unstructured-inference 1.1.2) to remediate CVEs.
> 
> - **Release**
>   - Set version to `0.18.21` and update `CHANGELOG.md`.
> - **Dependencies**
>   - Upgrade `unstructured-inference` to `1.1.2` in
>     `requirements/extra-pdf-image.txt` to address CVEs.
>   - Refresh pins across `requirements/*.txt` (base, dev, test, and
>     extras), including updates like `certifi`, `click`, `pypdf`, `pypandoc`,
>     `paddlepaddle`, `torch`/`torchvision`, `google-auth` stack, `protobuf`,
>     `safetensors`, etc.; normalize pip-compile headers and constraint paths.
> 
> <sup>Written by [Cursor
> Bugbot](https://cursor.com/dashboard?tab=bugbot) for commit
> face075955f8b733f28e17cd26863470b4622def. This will update automatically
> on new commits. Configure
> [here](https://cursor.com/dashboard?tab=bugbot).</sup>
<!-- /CURSOR_SUMMARY -->
This commit is contained in:
Lawrence Elitzer (LoLo) 2025-11-21 16:16:43 -06:00 committed by GitHub
parent 6c1bbb379c
commit 91a9888d35
No known key found for this signature in database
GPG Key ID: B5690EEEBB952194
16 changed files with 221 additions and 220 deletions

View File

@ -1,4 +1,4 @@
## 0.18.21-dev0 ## 0.18.21
### Enhancement ### Enhancement
- Update save_elements unit test to check crop box padding behavior - Update save_elements unit test to check crop box padding behavior
@ -6,6 +6,7 @@
### Features ### Features
### Fixes ### Fixes
- **Update `unstructured-inference`** to 1.1.2 to address CVEs
## 0.18.20 ## 0.18.20

View File

@ -2,15 +2,15 @@
# This file is autogenerated by pip-compile with Python 3.10 # This file is autogenerated by pip-compile with Python 3.10
# by the following command: # by the following command:
# #
# pip-compile ./base.in # pip-compile --no-strip-extras ./base.in
# #
anyio==4.11.0 anyio==4.11.0
# via httpx # via httpx
backoff==2.2.1 backoff==2.2.1
# via -r ./base.in # via -r base.in
beautifulsoup4==4.14.2 beautifulsoup4==4.14.2
# via -r ./base.in # via -r base.in
certifi==2025.10.5 certifi==2025.11.12
# via # via
# httpcore # httpcore
# httpx # httpx
@ -20,10 +20,10 @@ cffi==2.0.0
# via cryptography # via cryptography
charset-normalizer==3.4.4 charset-normalizer==3.4.4
# via # via
# -r ./base.in # -r base.in
# requests # requests
# unstructured-client # unstructured-client
click==8.3.0 click==8.3.1
# via # via
# nltk # nltk
# python-oxmsg # python-oxmsg
@ -31,20 +31,20 @@ cryptography==46.0.3
# via unstructured-client # via unstructured-client
dataclasses-json==0.6.7 dataclasses-json==0.6.7
# via # via
# -r ./base.in # -r base.in
# unstructured-client # unstructured-client
deepdiff==8.6.1 deepdiff==8.6.1
# via unstructured-client # via unstructured-client
emoji==2.15.0 emoji==2.15.0
# via -r ./base.in # via -r base.in
exceptiongroup==1.3.0 exceptiongroup==1.3.0
# via anyio # via anyio
filetype==1.2.0 filetype==1.2.0
# via -r ./base.in # via -r base.in
h11==0.16.0 h11==0.16.0
# via httpcore # via httpcore
html5lib==1.1 html5lib==1.1
# via -r ./base.in # via -r base.in
httpcore==1.0.9 httpcore==1.0.9
# via httpx # via httpx
httpx==0.28.1 httpx==0.28.1
@ -60,9 +60,9 @@ joblib==1.5.2
jsonpath-python==1.0.6 jsonpath-python==1.0.6
# via unstructured-client # via unstructured-client
langdetect==1.0.9 langdetect==1.0.9
# via -r ./base.in # via -r base.in
lxml==6.0.2 lxml==6.0.2
# via -r ./base.in # via -r base.in
marshmallow==3.26.1 marshmallow==3.26.1
# via # via
# dataclasses-json # dataclasses-json
@ -74,9 +74,9 @@ mypy-extensions==1.1.0
nest-asyncio==1.6.0 nest-asyncio==1.6.0
# via unstructured-client # via unstructured-client
nltk==3.9.2 nltk==3.9.2
# via -r ./base.in # via -r base.in
numpy==2.2.6 numpy==2.2.6
# via -r ./base.in # via -r base.in
olefile==0.47 olefile==0.47
# via python-oxmsg # via python-oxmsg
orderly-set==5.5.0 orderly-set==5.5.0
@ -86,26 +86,26 @@ packaging==25.0
# marshmallow # marshmallow
# unstructured-client # unstructured-client
psutil==7.1.3 psutil==7.1.3
# via -r ./base.in # via -r base.in
pycparser==2.23 pycparser==2.23
# via cffi # via cffi
pypdf==6.1.3 pypdf==6.3.0
# via unstructured-client # via unstructured-client
python-dateutil==2.9.0.post0 python-dateutil==2.9.0.post0
# via unstructured-client # via unstructured-client
python-iso639==2025.2.18 python-iso639==2025.11.16
# via -r ./base.in # via -r base.in
python-magic==0.4.27 python-magic==0.4.27
# via -r ./base.in # via -r base.in
python-oxmsg==0.0.2 python-oxmsg==0.0.2
# via -r ./base.in # via -r base.in
rapidfuzz==3.14.3 rapidfuzz==3.14.3
# via -r ./base.in # via -r base.in
regex==2025.11.3 regex==2025.11.3
# via nltk # via nltk
requests==2.32.5 requests==2.32.5
# via # via
# -r ./base.in # -r base.in
# requests-toolbelt # requests-toolbelt
# unstructured-client # unstructured-client
requests-toolbelt==1.0.0 requests-toolbelt==1.0.0
@ -122,11 +122,11 @@ soupsieve==2.8
# via beautifulsoup4 # via beautifulsoup4
tqdm==4.67.1 tqdm==4.67.1
# via # via
# -r ./base.in # -r base.in
# nltk # nltk
typing-extensions==4.15.0 typing-extensions==4.15.0
# via # via
# -r ./base.in # -r base.in
# anyio # anyio
# beautifulsoup4 # beautifulsoup4
# cryptography # cryptography
@ -141,14 +141,14 @@ typing-inspect==0.9.0
# unstructured-client # unstructured-client
unstructured-client==0.25.9 unstructured-client==0.25.9
# via # via
# -c /Users/luke/git/unstructured/requirements/deps/constraints.txt # -c deps/constraints.txt
# -r ./base.in # -r base.in
urllib3==2.5.0 urllib3==2.5.0
# via # via
# -c /Users/luke/git/unstructured/requirements/deps/constraints.txt # -c deps/constraints.txt
# requests # requests
# unstructured-client # unstructured-client
webencodings==0.5.1 webencodings==0.5.1
# via html5lib # via html5lib
wrapt==2.0.0 wrapt==2.0.1
# via -r ./base.in # via -r base.in

View File

@ -2,16 +2,16 @@
# This file is autogenerated by pip-compile with Python 3.10 # This file is autogenerated by pip-compile with Python 3.10
# by the following command: # by the following command:
# #
# pip-compile ./dev.in # pip-compile --no-strip-extras ./dev.in
# #
build==1.3.0 build==1.3.0
# via pip-tools # via pip-tools
cfgv==3.4.0 cfgv==3.5.0
# via pre-commit # via pre-commit
click==8.3.0 click==8.3.1
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# -c /Users/luke/git/unstructured/requirements/test.txt # -c test.txt
# pip-tools # pip-tools
distlib==0.4.0 distlib==0.4.0
# via virtualenv # via virtualenv
@ -23,17 +23,17 @@ nodeenv==1.9.1
# via pre-commit # via pre-commit
packaging==25.0 packaging==25.0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# -c /Users/luke/git/unstructured/requirements/test.txt # -c test.txt
# build # build
pip-tools==7.5.1 pip-tools==7.5.2
# via -r ./dev.in # via -r dev.in
platformdirs==4.5.0 platformdirs==4.5.0
# via # via
# -c /Users/luke/git/unstructured/requirements/test.txt # -c test.txt
# virtualenv # virtualenv
pre-commit==4.3.0 pre-commit==4.4.0
# via -r ./dev.in # via -r dev.in
pyproject-hooks==1.2.0 pyproject-hooks==1.2.0
# via # via
# build # build
@ -42,13 +42,13 @@ pyyaml==6.0.3
# via pre-commit # via pre-commit
tomli==2.3.0 tomli==2.3.0
# via # via
# -c /Users/luke/git/unstructured/requirements/test.txt # -c test.txt
# build # build
# pip-tools # pip-tools
typing-extensions==4.15.0 typing-extensions==4.15.0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# -c /Users/luke/git/unstructured/requirements/test.txt # -c test.txt
# virtualenv # virtualenv
virtualenv==20.35.4 virtualenv==20.35.4
# via pre-commit # via pre-commit

View File

@ -2,23 +2,23 @@
# This file is autogenerated by pip-compile with Python 3.10 # This file is autogenerated by pip-compile with Python 3.10
# by the following command: # by the following command:
# #
# pip-compile ./extra-csv.in # pip-compile --no-strip-extras ./extra-csv.in
# #
numpy==2.2.6 numpy==2.2.6
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# pandas # pandas
pandas==2.3.3 pandas==2.3.3
# via -r ./extra-csv.in # via -r extra-csv.in
python-dateutil==2.9.0.post0 python-dateutil==2.9.0.post0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# pandas # pandas
pytz==2025.2 pytz==2025.2
# via pandas # via pandas
six==1.17.0 six==1.17.0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# python-dateutil # python-dateutil
tzdata==2025.2 tzdata==2025.2
# via pandas # via pandas

View File

@ -2,15 +2,15 @@
# This file is autogenerated by pip-compile with Python 3.10 # This file is autogenerated by pip-compile with Python 3.10
# by the following command: # by the following command:
# #
# pip-compile ./extra-docx.in # pip-compile --no-strip-extras ./extra-docx.in
# #
lxml==6.0.2 lxml==6.0.2
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# python-docx # python-docx
python-docx==1.2.0 python-docx==1.2.0
# via -r ./extra-docx.in # via -r extra-docx.in
typing-extensions==4.15.0 typing-extensions==4.15.0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# python-docx # python-docx

View File

@ -2,7 +2,7 @@
# This file is autogenerated by pip-compile with Python 3.10 # This file is autogenerated by pip-compile with Python 3.10
# by the following command: # by the following command:
# #
# pip-compile ./extra-epub.in # pip-compile --no-strip-extras ./extra-epub.in
# #
pypandoc==1.15 pypandoc==1.16.2
# via -r ./extra-epub.in # via -r extra-epub.in

View File

@ -2,7 +2,7 @@
# This file is autogenerated by pip-compile with Python 3.10 # This file is autogenerated by pip-compile with Python 3.10
# by the following command: # by the following command:
# #
# pip-compile ./extra-markdown.in # pip-compile --no-strip-extras ./extra-markdown.in
# #
markdown==3.10 markdown==3.10
# via -r ./extra-markdown.in # via -r extra-markdown.in

View File

@ -2,17 +2,17 @@
# This file is autogenerated by pip-compile with Python 3.10 # This file is autogenerated by pip-compile with Python 3.10
# by the following command: # by the following command:
# #
# pip-compile ./extra-odt.in # pip-compile --no-strip-extras ./extra-odt.in
# #
lxml==6.0.2 lxml==6.0.2
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# python-docx # python-docx
pypandoc==1.15 pypandoc==1.16.2
# via -r ./extra-odt.in # via -r extra-odt.in
python-docx==1.2.0 python-docx==1.2.0
# via -r ./extra-odt.in # via -r extra-odt.in
typing-extensions==4.15.0 typing-extensions==4.15.0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# python-docx # python-docx

View File

@ -2,7 +2,7 @@
# This file is autogenerated by pip-compile with Python 3.10 # This file is autogenerated by pip-compile with Python 3.10
# by the following command: # by the following command:
# #
# pip-compile ./extra-paddleocr.in # pip-compile --no-strip-extras ./extra-paddleocr.in
# #
albucore==0.0.24 albucore==0.0.24
# via # via
@ -14,27 +14,27 @@ annotated-types==0.7.0
# via pydantic # via pydantic
anyio==4.11.0 anyio==4.11.0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# httpx # httpx
beautifulsoup4==4.14.2 beautifulsoup4==4.14.2
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# unstructured-paddleocr # unstructured-paddleocr
certifi==2025.10.5 certifi==2025.11.12
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# httpcore # httpcore
# httpx # httpx
# requests # requests
charset-normalizer==3.4.4 charset-normalizer==3.4.4
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# requests # requests
cython==3.2.0 cython==3.2.1
# via unstructured-paddleocr # via unstructured-paddleocr
exceptiongroup==1.3.0 exceptiongroup==1.3.0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# anyio # anyio
fire==0.7.1 fire==0.7.1
# via unstructured-paddleocr # via unstructured-paddleocr
@ -42,19 +42,19 @@ fonttools==4.60.1
# via unstructured-paddleocr # via unstructured-paddleocr
h11==0.16.0 h11==0.16.0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# httpcore # httpcore
httpcore==1.0.9 httpcore==1.0.9
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# httpx # httpx
httpx==0.28.1 httpx==0.28.1
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# paddlepaddle # paddlepaddle
idna==3.11 idna==3.11
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# anyio # anyio
# httpx # httpx
# requests # requests
@ -64,7 +64,7 @@ lazy-loader==0.4
# via scikit-image # via scikit-image
lxml==6.0.2 lxml==6.0.2
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# python-docx # python-docx
networkx==3.4.2 networkx==3.4.2
# via # via
@ -72,7 +72,7 @@ networkx==3.4.2
# scikit-image # scikit-image
numpy==2.2.6 numpy==2.2.6
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# albucore # albucore
# albumentations # albumentations
# imageio # imageio
@ -98,20 +98,20 @@ opt-einsum==3.3.0
# via paddlepaddle # via paddlepaddle
packaging==25.0 packaging==25.0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# lazy-loader # lazy-loader
# scikit-image # scikit-image
paddlepaddle==3.2.1 paddlepaddle==3.2.2
# via -r ./extra-paddleocr.in # via -r extra-paddleocr.in
pillow==12.0.0 pillow==12.0.0
# via # via
# imageio # imageio
# paddlepaddle # paddlepaddle
# scikit-image # scikit-image
# unstructured-paddleocr # unstructured-paddleocr
protobuf==6.33.0 protobuf==6.33.1
# via # via
# -c /Users/luke/git/unstructured/requirements/deps/constraints.txt # -c deps/constraints.txt
# paddlepaddle # paddlepaddle
pyclipper==1.3.0.post6 pyclipper==1.3.0.post6
# via unstructured-paddleocr # via unstructured-paddleocr
@ -127,13 +127,13 @@ pyyaml==6.0.3
# unstructured-paddleocr # unstructured-paddleocr
rapidfuzz==3.14.3 rapidfuzz==3.14.3
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# unstructured-paddleocr # unstructured-paddleocr
requests==2.32.5 requests==2.32.5
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# unstructured-paddleocr # unstructured-paddleocr
safetensors==0.6.2 safetensors==0.7.0
# via paddlepaddle # via paddlepaddle
scikit-image==0.25.2 scikit-image==0.25.2
# via unstructured-paddleocr # via unstructured-paddleocr
@ -147,11 +147,11 @@ simsimd==6.5.3
# via albucore # via albucore
sniffio==1.3.1 sniffio==1.3.1
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# anyio # anyio
soupsieve==2.8 soupsieve==2.8
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# beautifulsoup4 # beautifulsoup4
stringzilla==4.2.3 stringzilla==4.2.3
# via albucore # via albucore
@ -161,11 +161,11 @@ tifffile==2025.5.10
# via scikit-image # via scikit-image
tqdm==4.67.1 tqdm==4.67.1
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# unstructured-paddleocr # unstructured-paddleocr
typing-extensions==4.15.0 typing-extensions==4.15.0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# anyio # anyio
# beautifulsoup4 # beautifulsoup4
# exceptiongroup # exceptiongroup
@ -177,9 +177,9 @@ typing-extensions==4.15.0
typing-inspection==0.4.2 typing-inspection==0.4.2
# via pydantic # via pydantic
unstructured-paddleocr==2.10.0 unstructured-paddleocr==2.10.0
# via -r ./extra-paddleocr.in # via -r extra-paddleocr.in
urllib3==2.5.0 urllib3==2.5.0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# -c /Users/luke/git/unstructured/requirements/deps/constraints.txt # -c deps/constraints.txt
# requests # requests

View File

@ -2,7 +2,7 @@
# This file is autogenerated by pip-compile with Python 3.10 # This file is autogenerated by pip-compile with Python 3.10
# by the following command: # by the following command:
# #
# pip-compile ./extra-pandoc.in # pip-compile --no-strip-extras ./extra-pandoc.in
# #
pypandoc==1.15 pypandoc==1.16.2
# via -r ./extra-pandoc.in # via -r extra-pandoc.in

View File

@ -2,25 +2,25 @@
# This file is autogenerated by pip-compile with Python 3.10 # This file is autogenerated by pip-compile with Python 3.10
# by the following command: # by the following command:
# #
# pip-compile ./extra-pdf-image.in # pip-compile --no-strip-extras ./extra-pdf-image.in
# #
accelerate==1.11.0 accelerate==1.12.0
# via unstructured-inference # via unstructured-inference
antlr4-python3-runtime==4.9.3 antlr4-python3-runtime==4.9.3
# via omegaconf # via omegaconf
cachetools==6.2.1 cachetools==6.2.2
# via google-auth # via google-auth
certifi==2025.10.5 certifi==2025.11.12
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# requests # requests
cffi==2.0.0 cffi==2.0.0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# cryptography # cryptography
charset-normalizer==3.4.4 charset-normalizer==3.4.4
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# pdfminer-six # pdfminer-six
# requests # requests
coloredlogs==15.0.1 coloredlogs==15.0.1
@ -29,14 +29,14 @@ contourpy==1.3.2
# via matplotlib # via matplotlib
cryptography==46.0.3 cryptography==46.0.3
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# pdfminer-six # pdfminer-six
cycler==0.12.1 cycler==0.12.1
# via matplotlib # via matplotlib
deprecated==1.3.1 deprecated==1.3.1
# via pikepdf # via pikepdf
effdet==0.4.1 effdet==0.4.1
# via -r ./extra-pdf-image.in # via -r extra-pdf-image.in
filelock==3.20.0 filelock==3.20.0
# via # via
# huggingface-hub # huggingface-hub
@ -52,13 +52,13 @@ fsspec==2025.10.0
# torch # torch
google-api-core[grpc]==2.28.1 google-api-core[grpc]==2.28.1
# via google-cloud-vision # via google-cloud-vision
google-auth==2.42.1 google-auth==2.43.0
# via # via
# google-api-core # google-api-core
# google-cloud-vision # google-cloud-vision
google-cloud-vision==3.11.0 google-cloud-vision==3.11.0
# via -r ./extra-pdf-image.in # via -r extra-pdf-image.in
googleapis-common-protos==1.71.0 googleapis-common-protos==1.72.0
# via # via
# google-api-core # google-api-core
# grpcio-status # grpcio-status
@ -82,7 +82,7 @@ humanfriendly==10.0
# via coloredlogs # via coloredlogs
idna==3.11 idna==3.11
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# requests # requests
jinja2==3.1.6 jinja2==3.1.6
# via torch # via torch
@ -90,13 +90,13 @@ kiwisolver==1.4.9
# via matplotlib # via matplotlib
lxml==6.0.2 lxml==6.0.2
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# pikepdf # pikepdf
markupsafe==3.0.3 markupsafe==3.0.3
# via jinja2 # via jinja2
matplotlib==3.10.7 matplotlib==3.10.7
# via unstructured-inference # via unstructured-inference
ml-dtypes==0.5.3 ml-dtypes==0.5.4
# via onnx # via onnx
mpmath==1.3.0 mpmath==1.3.0
# via sympy # via sympy
@ -104,7 +104,7 @@ networkx==3.4.2
# via torch # via torch
numpy==2.2.6 numpy==2.2.6
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# accelerate # accelerate
# contourpy # contourpy
# matplotlib # matplotlib
@ -122,17 +122,17 @@ omegaconf==2.3.0
# via effdet # via effdet
onnx==1.19.1 onnx==1.19.1
# via # via
# -r ./extra-pdf-image.in # -r extra-pdf-image.in
# unstructured-inference # unstructured-inference
onnxruntime==1.23.2 onnxruntime==1.23.2
# via # via
# -r ./extra-pdf-image.in # -r extra-pdf-image.in
# unstructured-inference # unstructured-inference
opencv-python==4.12.0.88 opencv-python==4.12.0.88
# via unstructured-inference # via unstructured-inference
packaging==25.0 packaging==25.0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# accelerate # accelerate
# huggingface-hub # huggingface-hub
# matplotlib # matplotlib
@ -143,16 +143,16 @@ packaging==25.0
pandas==2.3.3 pandas==2.3.3
# via unstructured-inference # via unstructured-inference
pdf2image==1.17.0 pdf2image==1.17.0
# via -r ./extra-pdf-image.in # via -r extra-pdf-image.in
pdfminer-six==20250327 pdfminer-six==20250327
# via # via
# -c /Users/luke/git/unstructured/requirements/deps/constraints.txt # -c deps/constraints.txt
# -r ./extra-pdf-image.in # -r extra-pdf-image.in
# unstructured-inference # unstructured-inference
pi-heif==1.1.1 pi-heif==1.1.1
# via -r ./extra-pdf-image.in # via -r extra-pdf-image.in
pikepdf==10.0.0 pikepdf==10.0.2
# via -r ./extra-pdf-image.in # via -r extra-pdf-image.in
pillow==12.0.0 pillow==12.0.0
# via # via
# matplotlib # matplotlib
@ -165,9 +165,9 @@ proto-plus==1.26.1
# via # via
# google-api-core # google-api-core
# google-cloud-vision # google-cloud-vision
protobuf==6.33.0 protobuf==6.33.1
# via # via
# -c /Users/luke/git/unstructured/requirements/deps/constraints.txt # -c deps/constraints.txt
# google-api-core # google-api-core
# google-cloud-vision # google-cloud-vision
# googleapis-common-protos # googleapis-common-protos
@ -177,7 +177,7 @@ protobuf==6.33.0
# proto-plus # proto-plus
psutil==7.1.3 psutil==7.1.3
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# accelerate # accelerate
pyasn1==0.6.1 pyasn1==0.6.1
# via # via
@ -189,19 +189,19 @@ pycocotools==2.0.10
# via effdet # via effdet
pycparser==2.23 pycparser==2.23
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# cffi # cffi
pyparsing==3.2.5 pyparsing==3.2.5
# via matplotlib # via matplotlib
pypdf==6.1.3 pypdf==6.3.0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# -r ./extra-pdf-image.in # -r extra-pdf-image.in
pypdfium2==5.0.0 pypdfium2==5.0.0
# via unstructured-inference # via unstructured-inference
python-dateutil==2.9.0.post0 python-dateutil==2.9.0.post0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# matplotlib # matplotlib
# pandas # pandas
python-multipart==0.0.20 python-multipart==0.0.20
@ -217,21 +217,21 @@ pyyaml==6.0.3
# transformers # transformers
rapidfuzz==3.14.3 rapidfuzz==3.14.3
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# unstructured-inference # unstructured-inference
regex==2025.11.3 regex==2025.11.3
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# transformers # transformers
requests==2.32.5 requests==2.32.5
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# google-api-core # google-api-core
# huggingface-hub # huggingface-hub
# transformers # transformers
rsa==4.9.1 rsa==4.9.1
# via google-auth # via google-auth
safetensors==0.6.2 safetensors==0.7.0
# via # via
# accelerate # accelerate
# timm # timm
@ -240,7 +240,7 @@ scipy==1.15.3
# via unstructured-inference # via unstructured-inference
six==1.17.0 six==1.17.0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# python-dateutil # python-dateutil
sympy==1.14.0 sympy==1.14.0
# via # via
@ -252,29 +252,29 @@ timm==1.0.22
# unstructured-inference # unstructured-inference
tokenizers==0.21.4 tokenizers==0.21.4
# via # via
# -c /Users/luke/git/unstructured/requirements/deps/constraints.txt # -c deps/constraints.txt
# transformers # transformers
torch==2.9.0 torch==2.9.1
# via # via
# accelerate # accelerate
# effdet # effdet
# timm # timm
# torchvision # torchvision
# unstructured-inference # unstructured-inference
torchvision==0.24.0 torchvision==0.24.1
# via # via
# effdet # effdet
# timm # timm
tqdm==4.67.1 tqdm==4.67.1
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# huggingface-hub # huggingface-hub
# transformers # transformers
transformers==4.55.4 transformers==4.55.4
# via unstructured-inference # via unstructured-inference
typing-extensions==4.15.0 typing-extensions==4.15.0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# cryptography # cryptography
# grpcio # grpcio
# huggingface-hub # huggingface-hub
@ -283,16 +283,16 @@ typing-extensions==4.15.0
# torch # torch
tzdata==2025.2 tzdata==2025.2
# via pandas # via pandas
unstructured-inference==1.1.1 unstructured-inference==1.1.2
# via -r ./extra-pdf-image.in # via -r extra-pdf-image.in
unstructured-pytesseract==0.3.15 unstructured-pytesseract==0.3.15
# via -r ./extra-pdf-image.in # via -r extra-pdf-image.in
urllib3==2.5.0 urllib3==2.5.0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# -c /Users/luke/git/unstructured/requirements/deps/constraints.txt # -c deps/constraints.txt
# requests # requests
wrapt==2.0.0 wrapt==2.0.1
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# deprecated # deprecated

View File

@ -2,14 +2,14 @@
# This file is autogenerated by pip-compile with Python 3.10 # This file is autogenerated by pip-compile with Python 3.10
# by the following command: # by the following command:
# #
# pip-compile ./extra-pptx.in # pip-compile --no-strip-extras ./extra-pptx.in
# #
lxml==6.0.2 lxml==6.0.2
# via python-pptx # via python-pptx
pillow==12.0.0 pillow==12.0.0
# via python-pptx # via python-pptx
python-pptx==1.0.2 python-pptx==1.0.2
# via -r ./extra-pptx.in # via -r extra-pptx.in
typing-extensions==4.15.0 typing-extensions==4.15.0
# via python-pptx # via python-pptx
xlsxwriter==3.2.9 xlsxwriter==3.2.9

View File

@ -2,15 +2,15 @@
# This file is autogenerated by pip-compile with Python 3.10 # This file is autogenerated by pip-compile with Python 3.10
# by the following command: # by the following command:
# #
# pip-compile ./extra-xlsx.in # pip-compile --no-strip-extras ./extra-xlsx.in
# #
cffi==2.0.0 cffi==2.0.0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# cryptography # cryptography
cryptography==46.0.3 cryptography==46.0.3
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# msoffcrypto-tool # msoffcrypto-tool
et-xmlfile==2.0.0 et-xmlfile==2.0.0
# via openpyxl # via openpyxl
@ -20,11 +20,11 @@ networkx==3.4.2
# via -r extra-xlsx.in # via -r extra-xlsx.in
numpy==2.2.6 numpy==2.2.6
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# pandas # pandas
olefile==0.47 olefile==0.47
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# msoffcrypto-tool # msoffcrypto-tool
openpyxl==3.1.5 openpyxl==3.1.5
# via -r extra-xlsx.in # via -r extra-xlsx.in
@ -32,21 +32,21 @@ pandas==2.3.3
# via -r extra-xlsx.in # via -r extra-xlsx.in
pycparser==2.23 pycparser==2.23
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# cffi # cffi
python-dateutil==2.9.0.post0 python-dateutil==2.9.0.post0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# pandas # pandas
pytz==2025.2 pytz==2025.2
# via pandas # via pandas
six==1.17.0 six==1.17.0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# python-dateutil # python-dateutil
typing-extensions==4.15.0 typing-extensions==4.15.0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# cryptography # cryptography
tzdata==2025.2 tzdata==2025.2
# via pandas # via pandas

View File

@ -2,19 +2,19 @@
# This file is autogenerated by pip-compile with Python 3.10 # This file is autogenerated by pip-compile with Python 3.10
# by the following command: # by the following command:
# #
# pip-compile ./huggingface.in # pip-compile --no-strip-extras ./huggingface.in
# #
certifi==2025.10.5 certifi==2025.11.12
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# requests # requests
charset-normalizer==3.4.4 charset-normalizer==3.4.4
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# requests # requests
click==8.3.0 click==8.3.1
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# sacremoses # sacremoses
filelock==3.20.0 filelock==3.20.0
# via # via
@ -33,18 +33,18 @@ huggingface-hub==0.36.0
# transformers # transformers
idna==3.11 idna==3.11
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# requests # requests
jinja2==3.1.6 jinja2==3.1.6
# via torch # via torch
joblib==1.5.2 joblib==1.5.2
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# sacremoses # sacremoses
langdetect==1.0.9 langdetect==1.0.9
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# -r ./huggingface.in # -r huggingface.in
markupsafe==3.0.3 markupsafe==3.0.3
# via jinja2 # via jinja2
mpmath==1.3.0 mpmath==1.3.0
@ -53,11 +53,11 @@ networkx==3.4.2
# via torch # via torch
numpy==2.2.6 numpy==2.2.6
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# transformers # transformers
packaging==25.0 packaging==25.0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# huggingface-hub # huggingface-hub
# transformers # transformers
pyyaml==6.0.3 pyyaml==6.0.3
@ -66,47 +66,47 @@ pyyaml==6.0.3
# transformers # transformers
regex==2025.11.3 regex==2025.11.3
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# sacremoses # sacremoses
# transformers # transformers
requests==2.32.5 requests==2.32.5
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# huggingface-hub # huggingface-hub
# transformers # transformers
sacremoses==0.1.1 sacremoses==0.1.1
# via -r ./huggingface.in # via -r huggingface.in
safetensors==0.6.2 safetensors==0.7.0
# via transformers # via transformers
sentencepiece==0.2.1 sentencepiece==0.2.1
# via -r ./huggingface.in # via -r huggingface.in
six==1.17.0 six==1.17.0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# langdetect # langdetect
sympy==1.14.0 sympy==1.14.0
# via torch # via torch
tokenizers==0.21.4 tokenizers==0.21.4
# via # via
# -c /Users/luke/git/unstructured/requirements/deps/constraints.txt # -c deps/constraints.txt
# transformers # transformers
torch==2.9.0 torch==2.9.1
# via -r ./huggingface.in # via -r huggingface.in
tqdm==4.67.1 tqdm==4.67.1
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# huggingface-hub # huggingface-hub
# sacremoses # sacremoses
# transformers # transformers
transformers==4.55.4 transformers==4.55.4
# via -r ./huggingface.in # via -r huggingface.in
typing-extensions==4.15.0 typing-extensions==4.15.0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# huggingface-hub # huggingface-hub
# torch # torch
urllib3==2.5.0 urllib3==2.5.0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# -c /Users/luke/git/unstructured/requirements/deps/constraints.txt # -c deps/constraints.txt
# requests # requests

View File

@ -2,54 +2,54 @@
# This file is autogenerated by pip-compile with Python 3.10 # This file is autogenerated by pip-compile with Python 3.10
# by the following command: # by the following command:
# #
# pip-compile ./test.in # pip-compile --no-strip-extras ./test.in
# #
annotated-types==0.7.0 annotated-types==0.7.0
# via pydantic # via pydantic
autoflake==2.3.1 autoflake==2.3.1
# via -r ./test.in # via -r test.in
black==25.9.0 black==25.11.0
# via -r ./test.in # via -r test.in
click==8.3.0 click==8.3.1
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# black # black
coverage[toml]==7.11.0 coverage[toml]==7.12.0
# via # via
# -r ./test.in # -r test.in
# pytest-cov # pytest-cov
exceptiongroup==1.3.0 exceptiongroup==1.3.0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# pytest # pytest
execnet==2.1.1 execnet==2.1.2
# via pytest-xdist # via pytest-xdist
flake8==7.3.0 flake8==7.3.0
# via # via
# -r ./test.in # -r test.in
# flake8-print # flake8-print
flake8-print==5.0.0 flake8-print==5.0.0
# via -r ./test.in # via -r test.in
freezegun==1.5.5 freezegun==1.5.5
# via -r ./test.in # via -r test.in
grpcio==1.76.0 grpcio==1.76.0
# via -r ./test.in # via -r test.in
iniconfig==2.3.0 iniconfig==2.3.0
# via pytest # via pytest
liccheck==0.9.2 liccheck==0.9.2
# via -r ./test.in # via -r test.in
mccabe==0.7.0 mccabe==0.7.0
# via flake8 # via flake8
mypy==1.18.2 mypy==1.18.2
# via -r ./test.in # via -r test.in
mypy-extensions==1.1.0 mypy-extensions==1.1.0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# black # black
# mypy # mypy
packaging==25.0 packaging==25.0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# black # black
# pytest # pytest
pathspec==0.12.1 pathspec==0.12.1
@ -67,7 +67,7 @@ pycodestyle==2.14.0
# flake8 # flake8
# flake8-print # flake8-print
pydantic==2.12.4 pydantic==2.12.4
# via -r ./test.in # via -r test.in
pydantic-core==2.41.5 pydantic-core==2.41.5
# via pydantic # via pydantic
pyflakes==3.4.0 pyflakes==3.4.0
@ -76,30 +76,30 @@ pyflakes==3.4.0
# flake8 # flake8
pygments==2.19.2 pygments==2.19.2
# via pytest # via pytest
pytest==8.4.2 pytest==9.0.1
# via # via
# pytest-cov # pytest-cov
# pytest-mock # pytest-mock
# pytest-xdist # pytest-xdist
pytest-cov==7.0.0 pytest-cov==7.0.0
# via -r ./test.in # via -r test.in
pytest-mock==3.15.1 pytest-mock==3.15.1
# via -r ./test.in # via -r test.in
pytest-xdist==3.8.0 pytest-xdist==3.8.0
# via -r ./test.in # via -r test.in
python-dateutil==2.9.0.post0 python-dateutil==2.9.0.post0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# freezegun # freezegun
pytokens==0.3.0 pytokens==0.3.0
# via black # via black
ruff==0.14.3 ruff==0.14.6
# via -r ./test.in # via -r test.in
semantic-version==2.10.0 semantic-version==2.10.0
# via liccheck # via liccheck
six==1.17.0 six==1.17.0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# python-dateutil # python-dateutil
toml==0.10.2 toml==0.10.2
# via liccheck # via liccheck
@ -111,16 +111,16 @@ tomli==2.3.0
# mypy # mypy
# pytest # pytest
types-click==7.1.8 types-click==7.1.8
# via -r ./test.in # via -r test.in
types-markdown==3.9.0.20250906 types-markdown==3.10.0.20251106
# via -r ./test.in # via -r test.in
types-requests==2.32.4.20250913 types-requests==2.32.4.20250913
# via -r ./test.in # via -r test.in
types-tabulate==0.9.0.20241207 types-tabulate==0.9.0.20241207
# via -r ./test.in # via -r test.in
typing-extensions==4.15.0 typing-extensions==4.15.0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# black # black
# exceptiongroup # exceptiongroup
# grpcio # grpcio
@ -132,6 +132,6 @@ typing-inspection==0.4.2
# via pydantic # via pydantic
urllib3==2.5.0 urllib3==2.5.0
# via # via
# -c /Users/luke/git/unstructured/requirements/base.txt # -c base.txt
# -c /Users/luke/git/unstructured/requirements/deps/constraints.txt # -c deps/constraints.txt
# types-requests # types-requests

View File

@ -1 +1 @@
__version__ = "0.18.21-dev0" # pragma: no cover __version__ = "0.18.21" # pragma: no cover